mirror of https://github.com/cemu-project/Cemu.git
Misc. Linux improvements and bug fixes. (#121)
Co-authored-by: Tom Lally <tomlally@protonmail.com>
This commit is contained in:
parent
b8d4cf5b29
commit
d3a7b3b5a6
|
@ -28,15 +28,13 @@ elseif(UNIX)
|
||||||
add_definitions(-DVK_USE_PLATFORM_XLIB_KHR) # legacy. Do we need to support XLIB surfaces?
|
add_definitions(-DVK_USE_PLATFORM_XLIB_KHR) # legacy. Do we need to support XLIB surfaces?
|
||||||
add_definitions(-DVK_USE_PLATFORM_XCB_KHR)
|
add_definitions(-DVK_USE_PLATFORM_XCB_KHR)
|
||||||
endif()
|
endif()
|
||||||
add_definitions(-fms-extensions)
|
|
||||||
add_definitions(-fpermissive)
|
|
||||||
add_definitions(-maes)
|
add_definitions(-maes)
|
||||||
# warnings
|
# warnings
|
||||||
if(CMAKE_C_COMPILER_ID MATCHES "Clang")
|
if(CMAKE_C_COMPILER_ID MATCHES "Clang")
|
||||||
add_compile_options(-Wno-ambiguous-reversed-operator)
|
add_compile_options(-Wno-ambiguous-reversed-operator)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
add_compile_options(-Wno-switch -Wno-ignored-attributes -Wno-deprecated-enum-enum-conversion)
|
add_compile_options(-Wno-multichar -Wno-invalid-offsetof -Wno-switch -Wno-ignored-attributes -Wno-deprecated-enum-enum-conversion)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
add_definitions(-DVK_NO_PROTOTYPES)
|
add_definitions(-DVK_NO_PROTOTYPES)
|
||||||
|
|
|
@ -1,6 +1,6 @@
|
||||||
project(CemuCafe)
|
project(CemuCafe)
|
||||||
|
|
||||||
if((CMAKE_C_COMPILER_ID STREQUAL "GNU") OR (CMAKE_C_COMPILER_ID STREQUAL "Clang"))
|
if(CMAKE_C_COMPILER_ID STREQUAL "GNU")
|
||||||
add_compile_options(-mssse3 -mavx2)
|
add_compile_options(-mssse3 -mavx2)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
|
|
|
@ -40,5 +40,4 @@ namespace CafeSystem
|
||||||
|
|
||||||
extern RPLModule* applicationRPX;
|
extern RPLModule* applicationRPX;
|
||||||
|
|
||||||
extern std::atomic_bool g_isGameRunning;
|
|
||||||
extern std::atomic_bool g_isGPUInitFinished;
|
extern std::atomic_bool g_isGPUInitFinished;
|
||||||
|
|
|
@ -11,7 +11,7 @@ static uint32 ppc_cmp_and_mask[8] = {
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
#define ppc_word_rotl(_data, _n) (_rotl(_data,(_n)&0x1F))
|
#define ppc_word_rotl(_data, _n) (std::rotl<uint32>(_data,(_n)&0x1F))
|
||||||
|
|
||||||
static inline uint32 ppc_mask(int MB, int ME)
|
static inline uint32 ppc_mask(int MB, int ME)
|
||||||
{
|
{
|
||||||
|
|
|
@ -32,7 +32,7 @@ uint64 muldiv64(uint64 a, uint64 b, uint64 d)
|
||||||
bool PPCTimer_hasInvariantRDTSCSupport()
|
bool PPCTimer_hasInvariantRDTSCSupport()
|
||||||
{
|
{
|
||||||
uint32 cpuv[4];
|
uint32 cpuv[4];
|
||||||
__cpuid((int*)cpuv, 0x80000007);
|
cpuid((int*)cpuv, 0x80000007);
|
||||||
return ((cpuv[3] >> 8) & 1);
|
return ((cpuv[3] >> 8) & 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -106,11 +106,7 @@ uint64 PPCTimer_microsecondsToTsc(uint64 us)
|
||||||
uint64 PPCTimer_tscToMicroseconds(uint64 us)
|
uint64 PPCTimer_tscToMicroseconds(uint64 us)
|
||||||
{
|
{
|
||||||
uint128_t r{};
|
uint128_t r{};
|
||||||
#if BOOST_OS_WINDOWS
|
|
||||||
r.low = _umul128(us, 1000000ULL, &r.high);
|
r.low = _umul128(us, 1000000ULL, &r.high);
|
||||||
#else
|
|
||||||
r.low = _umul128(us, 1000000ULL, (unsigned long long*)&r.high);
|
|
||||||
#endif
|
|
||||||
|
|
||||||
|
|
||||||
uint64 remainder;
|
uint64 remainder;
|
||||||
|
@ -146,11 +142,7 @@ uint64 PPCTimer_getFromRDTSC()
|
||||||
rdtscDif = rdtscDif & ~(uint64)((sint64)rdtscDif >> 63);
|
rdtscDif = rdtscDif & ~(uint64)((sint64)rdtscDif >> 63);
|
||||||
|
|
||||||
uint128_t diff{};
|
uint128_t diff{};
|
||||||
#if BOOST_OS_WINDOWS
|
|
||||||
diff.low = _umul128(rdtscDif, Espresso::CORE_CLOCK, &diff.high);
|
diff.low = _umul128(rdtscDif, Espresso::CORE_CLOCK, &diff.high);
|
||||||
#else
|
|
||||||
diff.low = _umul128(rdtscDif, Espresso::CORE_CLOCK, (unsigned long long*)&diff.high);
|
|
||||||
#endif
|
|
||||||
|
|
||||||
if(rdtscCurrentMeasure > _rdtscLastMeasure)
|
if(rdtscCurrentMeasure > _rdtscLastMeasure)
|
||||||
_rdtscLastMeasure = rdtscCurrentMeasure; // only travel forward in time
|
_rdtscLastMeasure = rdtscCurrentMeasure; // only travel forward in time
|
||||||
|
|
|
@ -575,12 +575,12 @@ void PPCRecompiler_init()
|
||||||
|
|
||||||
// query processor extensions
|
// query processor extensions
|
||||||
int cpuInfo[4];
|
int cpuInfo[4];
|
||||||
__cpuid(cpuInfo, 0x80000001);
|
cpuid(cpuInfo, 0x80000001);
|
||||||
hasLZCNTSupport = ((cpuInfo[2] >> 5) & 1) != 0;
|
hasLZCNTSupport = ((cpuInfo[2] >> 5) & 1) != 0;
|
||||||
__cpuid(cpuInfo, 0x1);
|
cpuid(cpuInfo, 0x1);
|
||||||
hasMOVBESupport = ((cpuInfo[2] >> 22) & 1) != 0;
|
hasMOVBESupport = ((cpuInfo[2] >> 22) & 1) != 0;
|
||||||
hasAVXSupport = ((cpuInfo[2] >> 28) & 1) != 0;
|
hasAVXSupport = ((cpuInfo[2] >> 28) & 1) != 0;
|
||||||
__cpuidex(cpuInfo, 0x7, 0);
|
cpuidex(cpuInfo, 0x7, 0);
|
||||||
hasBMI2Support = ((cpuInfo[1] >> 8) & 1) != 0;
|
hasBMI2Support = ((cpuInfo[1] >> 8) & 1) != 0;
|
||||||
|
|
||||||
forceLog_printf("Recompiler initialized. CPU extensions: %s%s%s", hasLZCNTSupport ? "LZCNT " : "", hasMOVBESupport ? "MOVBE " : "", hasAVXSupport ? "AVX " : "");
|
forceLog_printf("Recompiler initialized. CPU extensions: %s%s%s", hasLZCNTSupport ? "LZCNT " : "", hasMOVBESupport ? "MOVBE " : "", hasAVXSupport ? "AVX " : "");
|
||||||
|
|
|
@ -81,31 +81,31 @@ void LatteShader_calculateFSKey(LatteFetchShader* fetchShader)
|
||||||
{
|
{
|
||||||
LatteParsedFetchShaderAttribute_t* attrib = group.attrib + f;
|
LatteParsedFetchShaderAttribute_t* attrib = group.attrib + f;
|
||||||
key += (uint64)attrib->endianSwap;
|
key += (uint64)attrib->endianSwap;
|
||||||
key = std::rotl(key, 3);
|
key = std::rotl<uint64>(key, 3);
|
||||||
key += (uint64)attrib->nfa;
|
key += (uint64)attrib->nfa;
|
||||||
key = std::rotl(key, 3);
|
key = std::rotl<uint64>(key, 3);
|
||||||
key += (uint64)(attrib->isSigned?1:0);
|
key += (uint64)(attrib->isSigned?1:0);
|
||||||
key = std::rotl(key, 1);
|
key = std::rotl<uint64>(key, 1);
|
||||||
key += (uint64)attrib->format;
|
key += (uint64)attrib->format;
|
||||||
key = std::rotl(key, 7);
|
key = std::rotl<uint64>(key, 7);
|
||||||
key += (uint64)attrib->fetchType;
|
key += (uint64)attrib->fetchType;
|
||||||
key = std::rotl(key, 8);
|
key = std::rotl<uint64>(key, 8);
|
||||||
key += (uint64)attrib->ds[0];
|
key += (uint64)attrib->ds[0];
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
key += (uint64)attrib->ds[1];
|
key += (uint64)attrib->ds[1];
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
key += (uint64)attrib->ds[2];
|
key += (uint64)attrib->ds[2];
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
key += (uint64)attrib->ds[3];
|
key += (uint64)attrib->ds[3];
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
key += (uint64)(attrib->aluDivisor+1);
|
key += (uint64)(attrib->aluDivisor+1);
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
key += (uint64)attrib->attributeBufferIndex;
|
key += (uint64)attrib->attributeBufferIndex;
|
||||||
key = std::rotl(key, 8);
|
key = std::rotl<uint64>(key, 8);
|
||||||
key += (uint64)attrib->semanticId;
|
key += (uint64)attrib->semanticId;
|
||||||
key = std::rotl(key, 8);
|
key = std::rotl<uint64>(key, 8);
|
||||||
key += (uint64)(attrib->offset & 3);
|
key += (uint64)(attrib->offset & 3);
|
||||||
key = std::rotl(key, 2);
|
key = std::rotl<uint64>(key, 2);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
// todo - also hash invalid buffer groups?
|
// todo - also hash invalid buffer groups?
|
||||||
|
|
|
@ -743,7 +743,7 @@ private:
|
||||||
//h ^= *memU64;
|
//h ^= *memU64;
|
||||||
//memU64++;
|
//memU64++;
|
||||||
|
|
||||||
h = std::rotr(h, 7);
|
h = std::rotr<uint64>(h, 7);
|
||||||
h += (*memU64 + (uint64)i);
|
h += (*memU64 + (uint64)i);
|
||||||
memU64++;
|
memU64++;
|
||||||
}
|
}
|
||||||
|
|
|
@ -158,15 +158,15 @@ void LatteMRT::ApplyCurrentState()
|
||||||
if (colorView)
|
if (colorView)
|
||||||
{
|
{
|
||||||
key += ((uint64)colorView);
|
key += ((uint64)colorView);
|
||||||
key = std::rotl(key, 5);
|
key = std::rotl<uint64>(key, 5);
|
||||||
fboLookupView = colorView;
|
fboLookupView = colorView;
|
||||||
}
|
}
|
||||||
key = std::rotl(key, 7);
|
key = std::rotl<uint64>(key, 7);
|
||||||
}
|
}
|
||||||
if (sLatteCurrentRendertargets.depthBuffer.view)
|
if (sLatteCurrentRendertargets.depthBuffer.view)
|
||||||
{
|
{
|
||||||
key += ((uint64)sLatteCurrentRendertargets.depthBuffer.view);
|
key += ((uint64)sLatteCurrentRendertargets.depthBuffer.view);
|
||||||
key = std::rotl(key, 5);
|
key = std::rotl<uint64>(key, 5);
|
||||||
key += (sLatteCurrentRendertargets.depthBuffer.hasStencil);
|
key += (sLatteCurrentRendertargets.depthBuffer.hasStencil);
|
||||||
if (fboLookupView == NULL)
|
if (fboLookupView == NULL)
|
||||||
{
|
{
|
||||||
|
|
|
@ -263,7 +263,7 @@ void LatteShader_UpdatePSInputs(uint32* contextRegisters)
|
||||||
cemu_assert_debug(psSemanticId != 0xFF);
|
cemu_assert_debug(psSemanticId != 0xFF);
|
||||||
|
|
||||||
key += (uint64)psInputControl;
|
key += (uint64)psInputControl;
|
||||||
key = std::rotl(key, 7);
|
key = std::rotl<uint64>(key, 7);
|
||||||
if (spi0_positionEnable && f == spi0_positionAddr)
|
if (spi0_positionEnable && f == spi0_positionAddr)
|
||||||
{
|
{
|
||||||
_activePSImportTable.import[f].semanticId = LATTE_ANALYZER_IMPORT_INDEX_SPIPOSITION;
|
_activePSImportTable.import[f].semanticId = LATTE_ANALYZER_IMPORT_INDEX_SPIPOSITION;
|
||||||
|
@ -546,7 +546,7 @@ uint64 LatteSHRC_CalcVSAuxHash(LatteDecompilerShader* vertexShader, uint32* cont
|
||||||
if(!vertexShader->streamoutBufferWriteMask2[i])
|
if(!vertexShader->streamoutBufferWriteMask2[i])
|
||||||
continue;
|
continue;
|
||||||
uint32 bufferStride = contextRegisters[mmVGT_STRMOUT_VTX_STRIDE_0 + i * 4];
|
uint32 bufferStride = contextRegisters[mmVGT_STRMOUT_VTX_STRIDE_0 + i * 4];
|
||||||
auxHash = std::rotl(auxHash, 7);
|
auxHash = std::rotl<uint64>(auxHash, 7);
|
||||||
auxHash += (uint64)bufferStride;
|
auxHash += (uint64)bufferStride;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -559,7 +559,7 @@ uint64 LatteSHRC_CalcVSAuxHash(LatteDecompilerShader* vertexShader, uint32* cont
|
||||||
if ((word4 & 0x300) == 0x100)
|
if ((word4 & 0x300) == 0x100)
|
||||||
{
|
{
|
||||||
// integer format
|
// integer format
|
||||||
auxHashTex = std::rotl(auxHashTex, 7);
|
auxHashTex = std::rotl<uint64>(auxHashTex, 7);
|
||||||
auxHashTex += 0x333;
|
auxHashTex += 0x333;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -984,7 +984,7 @@ float get_##__regname() const \
|
||||||
SRF_MODE_NO_ZERO = 1,
|
SRF_MODE_NO_ZERO = 1,
|
||||||
};
|
};
|
||||||
|
|
||||||
using E_ENDIAN_SWAP = E_ENDIAN_SWAP;
|
// using E_ENDIAN_SWAP = E_ENDIAN_SWAP;
|
||||||
|
|
||||||
enum class E_SEL
|
enum class E_SEL
|
||||||
{
|
{
|
||||||
|
|
|
@ -44,9 +44,9 @@ void OpenGLRenderer::uniformData_update()
|
||||||
for (sint32 f = 0; f < remappedArraySize; f++)
|
for (sint32 f = 0; f < remappedArraySize; f++)
|
||||||
{
|
{
|
||||||
uniformDataHash[0] ^= remappedUniformData64[0];
|
uniformDataHash[0] ^= remappedUniformData64[0];
|
||||||
uniformDataHash[0] = std::rotl(uniformDataHash[0], 11);
|
uniformDataHash[0] = std::rotl<uint64>(uniformDataHash[0], 11);
|
||||||
uniformDataHash[1] ^= remappedUniformData64[1];
|
uniformDataHash[1] ^= remappedUniformData64[1];
|
||||||
uniformDataHash[1] = std::rotl(uniformDataHash[1], 11);
|
uniformDataHash[1] = std::rotl<uint64>(uniformDataHash[1], 11);
|
||||||
remappedUniformData64 += 2;
|
remappedUniformData64 += 2;
|
||||||
}
|
}
|
||||||
if (shader->uniformDataHash64[0] != uniformDataHash[0] || shader->uniformDataHash64[1] != uniformDataHash[1])
|
if (shader->uniformDataHash64[0] != uniformDataHash[0] || shader->uniformDataHash64[1] != uniformDataHash[1])
|
||||||
|
|
|
@ -8,7 +8,7 @@ uint32 RendererShader::GeneratePrecompiledCacheId()
|
||||||
const char* s = EMULATOR_VERSION_SUFFIX;
|
const char* s = EMULATOR_VERSION_SUFFIX;
|
||||||
while (*s)
|
while (*s)
|
||||||
{
|
{
|
||||||
v = _rotl(v, 7);
|
v = std::rotl<uint32>(v, 7);
|
||||||
v += (uint32)(*s);
|
v += (uint32)(*s);
|
||||||
s++;
|
s++;
|
||||||
}
|
}
|
||||||
|
|
|
@ -4050,13 +4050,13 @@ VKRObjectRenderPass::VKRObjectRenderPass(AttachmentInfo_t& attachmentInfo, sint3
|
||||||
if (attachmentInfo.colorAttachment[i].isPresent || attachmentInfo.colorAttachment[i].viewObj)
|
if (attachmentInfo.colorAttachment[i].isPresent || attachmentInfo.colorAttachment[i].viewObj)
|
||||||
{
|
{
|
||||||
stateHash += attachmentInfo.colorAttachment[i].format + i * 31;
|
stateHash += attachmentInfo.colorAttachment[i].format + i * 31;
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (attachmentInfo.depthAttachment.isPresent || attachmentInfo.depthAttachment.viewObj)
|
if (attachmentInfo.depthAttachment.isPresent || attachmentInfo.depthAttachment.viewObj)
|
||||||
{
|
{
|
||||||
stateHash += attachmentInfo.depthAttachment.format;
|
stateHash += attachmentInfo.depthAttachment.format;
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
}
|
}
|
||||||
m_hashForPipeline = stateHash;
|
m_hashForPipeline = stateHash;
|
||||||
|
|
||||||
|
|
|
@ -24,18 +24,18 @@ uint64 VulkanRenderer::draw_calculateMinimalGraphicsPipelineHash(const LatteFetc
|
||||||
for (auto& group : fetchShader->bufferGroups)
|
for (auto& group : fetchShader->bufferGroups)
|
||||||
{
|
{
|
||||||
uint32 bufferStride = group.getCurrentBufferStride(lcr.GetRawView());
|
uint32 bufferStride = group.getCurrentBufferStride(lcr.GetRawView());
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
stateHash += bufferStride * 3;
|
stateHash += bufferStride * 3;
|
||||||
}
|
}
|
||||||
|
|
||||||
stateHash += fetchShader->getVkPipelineHashFragment();
|
stateHash += fetchShader->getVkPipelineHashFragment();
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
|
|
||||||
stateHash += lcr.GetRawView()[mmVGT_PRIMITIVE_TYPE];
|
stateHash += lcr.GetRawView()[mmVGT_PRIMITIVE_TYPE];
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
|
|
||||||
stateHash += lcr.GetRawView()[mmVGT_STRMOUT_EN];
|
stateHash += lcr.GetRawView()[mmVGT_STRMOUT_EN];
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
|
|
||||||
if(lcr.PA_CL_CLIP_CNTL.get_DX_RASTERIZATION_KILL())
|
if(lcr.PA_CL_CLIP_CNTL.get_DX_RASTERIZATION_KILL())
|
||||||
stateHash += 0x333333;
|
stateHash += 0x333333;
|
||||||
|
@ -66,24 +66,24 @@ uint64 VulkanRenderer::draw_calculateGraphicsPipelineHash(const LatteFetchShader
|
||||||
if (vertexShader)
|
if (vertexShader)
|
||||||
stateHash += vertexShader->baseHash;
|
stateHash += vertexShader->baseHash;
|
||||||
|
|
||||||
stateHash = std::rotl(stateHash, 13);
|
stateHash = std::rotl<uint64>(stateHash, 13);
|
||||||
|
|
||||||
if (geometryShader)
|
if (geometryShader)
|
||||||
stateHash += geometryShader->baseHash;
|
stateHash += geometryShader->baseHash;
|
||||||
|
|
||||||
stateHash = std::rotl(stateHash, 13);
|
stateHash = std::rotl<uint64>(stateHash, 13);
|
||||||
|
|
||||||
if (pixelShader)
|
if (pixelShader)
|
||||||
stateHash += pixelShader->baseHash + pixelShader->auxHash;
|
stateHash += pixelShader->baseHash + pixelShader->auxHash;
|
||||||
|
|
||||||
stateHash = std::rotl(stateHash, 13);
|
stateHash = std::rotl<uint64>(stateHash, 13);
|
||||||
|
|
||||||
uint32 polygonCtrl = lcr.PA_SU_SC_MODE_CNTL.getRawValue();
|
uint32 polygonCtrl = lcr.PA_SU_SC_MODE_CNTL.getRawValue();
|
||||||
stateHash += polygonCtrl;
|
stateHash += polygonCtrl;
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
|
|
||||||
stateHash += ctxRegister[Latte::REGADDR::PA_CL_CLIP_CNTL];
|
stateHash += ctxRegister[Latte::REGADDR::PA_CL_CLIP_CNTL];
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
|
|
||||||
const auto colorControlReg = ctxRegister[Latte::REGADDR::CB_COLOR_CONTROL];
|
const auto colorControlReg = ctxRegister[Latte::REGADDR::CB_COLOR_CONTROL];
|
||||||
stateHash += colorControlReg;
|
stateHash += colorControlReg;
|
||||||
|
@ -97,7 +97,7 @@ uint64 VulkanRenderer::draw_calculateGraphicsPipelineHash(const LatteFetchShader
|
||||||
{
|
{
|
||||||
if (((blendEnableMask & (1 << i))) == 0)
|
if (((blendEnableMask & (1 << i))) == 0)
|
||||||
continue;
|
continue;
|
||||||
stateHash = std::rotl(stateHash, 7);
|
stateHash = std::rotl<uint64>(stateHash, 7);
|
||||||
stateHash += ctxRegister[Latte::REGADDR::CB_BLEND0_CONTROL + i];
|
stateHash += ctxRegister[Latte::REGADDR::CB_BLEND0_CONTROL + i];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -109,11 +109,11 @@ uint64 VulkanRenderer::draw_calculateGraphicsPipelineHash(const LatteFetchShader
|
||||||
if (stencilTestEnable)
|
if (stencilTestEnable)
|
||||||
{
|
{
|
||||||
stateHash += ctxRegister[mmDB_STENCILREFMASK];
|
stateHash += ctxRegister[mmDB_STENCILREFMASK];
|
||||||
stateHash = std::rotl(stateHash, 17);
|
stateHash = std::rotl<uint64>(stateHash, 17);
|
||||||
if(depthControl & (1<<7)) // back stencil enable
|
if(depthControl & (1<<7)) // back stencil enable
|
||||||
{
|
{
|
||||||
stateHash += ctxRegister[mmDB_STENCILREFMASK_BF];
|
stateHash += ctxRegister[mmDB_STENCILREFMASK_BF];
|
||||||
stateHash = std::rotl(stateHash, 13);
|
stateHash = std::rotl<uint64>(stateHash, 13);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
|
@ -122,7 +122,7 @@ uint64 VulkanRenderer::draw_calculateGraphicsPipelineHash(const LatteFetchShader
|
||||||
depthControl &= 0xFF;
|
depthControl &= 0xFF;
|
||||||
}
|
}
|
||||||
|
|
||||||
stateHash = std::rotl(stateHash, 17);
|
stateHash = std::rotl<uint64>(stateHash, 17);
|
||||||
stateHash += depthControl;
|
stateHash += depthControl;
|
||||||
|
|
||||||
// polygon offset
|
// polygon offset
|
||||||
|
@ -542,16 +542,16 @@ uint64 VulkanRenderer::GetDescriptorSetStateHash(LatteDecompilerShader* shader)
|
||||||
{
|
{
|
||||||
samplerIndex += LatteDecompiler_getTextureSamplerBaseIndex(shader->shaderType);
|
samplerIndex += LatteDecompiler_getTextureSamplerBaseIndex(shader->shaderType);
|
||||||
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 0];
|
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 0];
|
||||||
hash = std::rotl(hash, 7);
|
hash = std::rotl<uint64>(hash, 7);
|
||||||
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 1];
|
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 1];
|
||||||
hash = std::rotl(hash, 7);
|
hash = std::rotl<uint64>(hash, 7);
|
||||||
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 2];
|
hash += LatteGPUState.contextRegister[Latte::REGADDR::SQ_TEX_SAMPLER_WORD0_0 + samplerIndex * 3 + 2];
|
||||||
hash = std::rotl(hash, 7);
|
hash = std::rotl<uint64>(hash, 7);
|
||||||
}
|
}
|
||||||
hash = std::rotl(hash, 7);
|
hash = std::rotl<uint64>(hash, 7);
|
||||||
// hash view id + swizzle mask
|
// hash view id + swizzle mask
|
||||||
hash += (uint64)texture->GetUniqueId();
|
hash += (uint64)texture->GetUniqueId();
|
||||||
hash = std::rotr(hash, 21);
|
hash = std::rotr<uint64>(hash, 21);
|
||||||
hash += (uint64)(word4 & 0x0FFF0000);
|
hash += (uint64)(word4 & 0x0FFF0000);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -108,12 +108,12 @@ uint64 VulkanRenderer::copySurface_getPipelineStateHash(VkCopySurfaceState_t& st
|
||||||
uint64 h = 0;
|
uint64 h = 0;
|
||||||
|
|
||||||
h += (uintptr_t)state.destinationTexture->GetFormat();
|
h += (uintptr_t)state.destinationTexture->GetFormat();
|
||||||
h = std::rotr(h, 7);
|
h = std::rotr<uint64>(h, 7);
|
||||||
|
|
||||||
h += state.sourceTexture->isDepth ? 0x1111ull : 0;
|
h += state.sourceTexture->isDepth ? 0x1111ull : 0;
|
||||||
h = std::rotr(h, 7);
|
h = std::rotr<uint64>(h, 7);
|
||||||
h += state.destinationTexture->isDepth ? 0x1112ull : 0;
|
h += state.destinationTexture->isDepth ? 0x1112ull : 0;
|
||||||
h = std::rotr(h, 7);
|
h = std::rotr<uint64>(h, 7);
|
||||||
|
|
||||||
return h;
|
return h;
|
||||||
}
|
}
|
||||||
|
|
|
@ -563,10 +563,10 @@ int iosuAct_thread()
|
||||||
|
|
||||||
uint32 name = (uint32)actCemuRequest->uuidName;
|
uint32 name = (uint32)actCemuRequest->uuidName;
|
||||||
uint8 tempArray[] = {
|
uint8 tempArray[] = {
|
||||||
(name >> 24) & 0xFF,
|
static_cast<uint8>((name >> 24) & 0xFF),
|
||||||
(name >> 16) & 0xFF,
|
static_cast<uint8>((name >> 16) & 0xFF),
|
||||||
(name >> 8) & 0xFF,
|
static_cast<uint8>((name >> 8) & 0xFF),
|
||||||
(name >> 0) & 0xFF,
|
static_cast<uint8>((name >> 0) & 0xFF),
|
||||||
0x3A,
|
0x3A,
|
||||||
0x27,
|
0x27,
|
||||||
0x5E,
|
0x5E,
|
||||||
|
|
|
@ -713,8 +713,8 @@ void _calculateMappedImportNameHash(const char* rplName, const char* funcName, u
|
||||||
uint64 v = (uint64)*rplName;
|
uint64 v = (uint64)*rplName;
|
||||||
h1 += v;
|
h1 += v;
|
||||||
h2 ^= v;
|
h2 ^= v;
|
||||||
h1 = std::rotl(h1, 3);
|
h1 = std::rotl<uint64>(h1, 3);
|
||||||
h2 = std::rotl(h2, 7);
|
h2 = std::rotl<uint64>(h2, 7);
|
||||||
rplName++;
|
rplName++;
|
||||||
}
|
}
|
||||||
// funcName
|
// funcName
|
||||||
|
@ -723,8 +723,8 @@ void _calculateMappedImportNameHash(const char* rplName, const char* funcName, u
|
||||||
uint64 v = (uint64)*funcName;
|
uint64 v = (uint64)*funcName;
|
||||||
h1 += v;
|
h1 += v;
|
||||||
h2 ^= v;
|
h2 ^= v;
|
||||||
h1 = std::rotl(h1, 3);
|
h1 = std::rotl<uint64>(h1, 3);
|
||||||
h2 = std::rotl(h2, 7);
|
h2 = std::rotl<uint64>(h2, 7);
|
||||||
funcName++;
|
funcName++;
|
||||||
}
|
}
|
||||||
*h1Out = h1;
|
*h1Out = h1;
|
||||||
|
|
|
@ -228,11 +228,39 @@ typedef union _LARGE_INTEGER {
|
||||||
#if defined(_MSC_VER)
|
#if defined(_MSC_VER)
|
||||||
#define DLLEXPORT __declspec(dllexport)
|
#define DLLEXPORT __declspec(dllexport)
|
||||||
#elif defined(__GNUC__)
|
#elif defined(__GNUC__)
|
||||||
#define DLLEXPORT __attribute__((dllexport))
|
#if BOOST_OS_WINDOWS
|
||||||
|
#define DLLEXPORT __attribute__((dllexport))
|
||||||
|
#else
|
||||||
|
#define DLLEXPORT
|
||||||
|
#endif
|
||||||
#else
|
#else
|
||||||
#error No definition for DLLEXPORT
|
#error No definition for DLLEXPORT
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#ifdef __GNUC__
|
||||||
|
#include <cpuid.h>
|
||||||
|
#endif
|
||||||
|
|
||||||
|
inline void cpuid(int cpuInfo[4], int functionId) {
|
||||||
|
#if defined(_MSC_VER)
|
||||||
|
__cpuid(cpuInfo, functionId);
|
||||||
|
#elif defined(__GNUC__)
|
||||||
|
__cpuid(functionId, cpuInfo[0], cpuInfo[1], cpuInfo[2], cpuInfo[3]);
|
||||||
|
#else
|
||||||
|
#error No definition for cpuid
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
|
inline void cpuidex(int cpuInfo[4], int functionId, int subFunctionId) {
|
||||||
|
#if defined(_MSC_VER)
|
||||||
|
__cpuidex(cpuInfo, functionId, subFunctionId);
|
||||||
|
#elif defined(__GNUC__)
|
||||||
|
__cpuid_count(functionId, subFunctionId, cpuInfo[0], cpuInfo[1], cpuInfo[2], cpuInfo[3]);
|
||||||
|
#else
|
||||||
|
#error No definition for cpuidex
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
// MEMPTR
|
// MEMPTR
|
||||||
#include "Common/MemPtr.h"
|
#include "Common/MemPtr.h"
|
||||||
|
|
|
@ -7,19 +7,3 @@ uint32_t GetTickCount()
|
||||||
clock_gettime(CLOCK_MONOTONIC, &ts);
|
clock_gettime(CLOCK_MONOTONIC, &ts);
|
||||||
return (1000 * ts.tv_sec + ts.tv_nsec / 1000000);
|
return (1000 * ts.tv_sec + ts.tv_nsec / 1000000);
|
||||||
}
|
}
|
||||||
|
|
||||||
#include <cpuid.h>
|
|
||||||
|
|
||||||
void (__cpuid)(int __cpuVal[4], unsigned int __leaf)
|
|
||||||
{
|
|
||||||
__cpuid(__cpuVal[0], __cpuVal[1], __cpuVal[2], __cpuVal[3], __leaf);
|
|
||||||
}
|
|
||||||
#undef __cpuid
|
|
||||||
|
|
||||||
#ifdef __clang__
|
|
||||||
void __cpuidex(int __cpuid_info[4], int __leaf, int __subleaf)
|
|
||||||
{
|
|
||||||
__cpuid_count (__leaf, __subleaf, __cpuid_info[0], __cpuid_info[1],
|
|
||||||
__cpuid_info[2], __cpuid_info[3]);
|
|
||||||
}
|
|
||||||
#endif
|
|
|
@ -40,10 +40,6 @@ inline uint32_t GetExceptionError()
|
||||||
#undef Success
|
#undef Success
|
||||||
#undef ClientMessage
|
#undef ClientMessage
|
||||||
|
|
||||||
// cpu id (somewhat hacky, reorganize later)
|
|
||||||
void (__cpuid)(int __cpuVal[4], unsigned int __leaf);
|
|
||||||
void __cpuidex (int __cpuid_info[4], int __leaf, int __subleaf);
|
|
||||||
|
|
||||||
// placeholder
|
// placeholder
|
||||||
uint32_t GetTickCount();
|
uint32_t GetTickCount();
|
||||||
|
|
||||||
|
|
|
@ -62,11 +62,11 @@ void logCPUAndMemoryInfo()
|
||||||
unsigned nExIds, i = 0;
|
unsigned nExIds, i = 0;
|
||||||
char CPUBrandString[0x40];
|
char CPUBrandString[0x40];
|
||||||
// Get the information associated with each extended ID.
|
// Get the information associated with each extended ID.
|
||||||
__cpuid(CPUInfo, 0x80000000);
|
cpuid(CPUInfo, 0x80000000);
|
||||||
nExIds = CPUInfo[0];
|
nExIds = CPUInfo[0];
|
||||||
for (i = 0x80000000; i <= nExIds; ++i)
|
for (i = 0x80000000; i <= nExIds; ++i)
|
||||||
{
|
{
|
||||||
__cpuid(CPUInfo, i);
|
cpuid(CPUInfo, i);
|
||||||
// Interpret CPU brand string
|
// Interpret CPU brand string
|
||||||
if (i == 0x80000002)
|
if (i == 0x80000002)
|
||||||
memcpy(CPUBrandString, CPUInfo, sizeof(CPUInfo));
|
memcpy(CPUBrandString, CPUInfo, sizeof(CPUInfo));
|
||||||
|
@ -194,11 +194,11 @@ void mainEmulatorCommonInit()
|
||||||
PPCTimer_init();
|
PPCTimer_init();
|
||||||
// check available CPU extensions
|
// check available CPU extensions
|
||||||
int cpuInfo[4];
|
int cpuInfo[4];
|
||||||
__cpuid(cpuInfo, 0x1);
|
cpuid(cpuInfo, 0x1);
|
||||||
_cpuExtension_SSSE3 = ((cpuInfo[2] >> 9) & 1) != 0;
|
_cpuExtension_SSSE3 = ((cpuInfo[2] >> 9) & 1) != 0;
|
||||||
_cpuExtension_SSE4_1 = ((cpuInfo[2] >> 19) & 1) != 0;
|
_cpuExtension_SSE4_1 = ((cpuInfo[2] >> 19) & 1) != 0;
|
||||||
|
|
||||||
__cpuidex(cpuInfo, 0x7, 0);
|
cpuidex(cpuInfo, 0x7, 0);
|
||||||
_cpuExtension_AVX2 = ((cpuInfo[1] >> 5) & 1) != 0;
|
_cpuExtension_AVX2 = ((cpuInfo[1] >> 5) & 1) != 0;
|
||||||
|
|
||||||
#if BOOST_OS_WINDOWS
|
#if BOOST_OS_WINDOWS
|
||||||
|
|
|
@ -332,25 +332,25 @@ void InvMixColumns(aes128Ctx_t* aesCtx)
|
||||||
b = stateVal(0, 1);
|
b = stateVal(0, 1);
|
||||||
c = stateVal(0, 2);
|
c = stateVal(0, 2);
|
||||||
d = stateVal(0, 3);
|
d = stateVal(0, 3);
|
||||||
stateValU32(0) = lookupTable_multiply[a] ^ _rotl(lookupTable_multiply[b], 8) ^ _rotl(lookupTable_multiply[c], 16) ^ _rotl(lookupTable_multiply[d], 24);
|
stateValU32(0) = lookupTable_multiply[a] ^ std::rotl<uint32>(lookupTable_multiply[b], 8) ^ std::rotl<uint32>(lookupTable_multiply[c], 16) ^ std::rotl<uint32>(lookupTable_multiply[d], 24);
|
||||||
// i1
|
// i1
|
||||||
a = stateVal(1, 0);
|
a = stateVal(1, 0);
|
||||||
b = stateVal(1, 1);
|
b = stateVal(1, 1);
|
||||||
c = stateVal(1, 2);
|
c = stateVal(1, 2);
|
||||||
d = stateVal(1, 3);
|
d = stateVal(1, 3);
|
||||||
stateValU32(1) = lookupTable_multiply[a] ^ _rotl(lookupTable_multiply[b], 8) ^ _rotl(lookupTable_multiply[c], 16) ^ _rotl(lookupTable_multiply[d], 24);
|
stateValU32(1) = lookupTable_multiply[a] ^ std::rotl<uint32>(lookupTable_multiply[b], 8) ^ std::rotl<uint32>(lookupTable_multiply[c], 16) ^ std::rotl<uint32>(lookupTable_multiply[d], 24);
|
||||||
// i2
|
// i2
|
||||||
a = stateVal(2, 0);
|
a = stateVal(2, 0);
|
||||||
b = stateVal(2, 1);
|
b = stateVal(2, 1);
|
||||||
c = stateVal(2, 2);
|
c = stateVal(2, 2);
|
||||||
d = stateVal(2, 3);
|
d = stateVal(2, 3);
|
||||||
stateValU32(2) = lookupTable_multiply[a] ^ _rotl(lookupTable_multiply[b], 8) ^ _rotl(lookupTable_multiply[c], 16) ^ _rotl(lookupTable_multiply[d], 24);
|
stateValU32(2) = lookupTable_multiply[a] ^ std::rotl<uint32>(lookupTable_multiply[b], 8) ^ std::rotl<uint32>(lookupTable_multiply[c], 16) ^ std::rotl<uint32>(lookupTable_multiply[d], 24);
|
||||||
// i3
|
// i3
|
||||||
a = stateVal(3, 0);
|
a = stateVal(3, 0);
|
||||||
b = stateVal(3, 1);
|
b = stateVal(3, 1);
|
||||||
c = stateVal(3, 2);
|
c = stateVal(3, 2);
|
||||||
d = stateVal(3, 3);
|
d = stateVal(3, 3);
|
||||||
stateValU32(3) = lookupTable_multiply[a] ^ _rotl(lookupTable_multiply[b], 8) ^ _rotl(lookupTable_multiply[c], 16) ^ _rotl(lookupTable_multiply[d], 24);
|
stateValU32(3) = lookupTable_multiply[a] ^ std::rotl<uint32>(lookupTable_multiply[b], 8) ^ std::rotl<uint32>(lookupTable_multiply[c], 16) ^ std::rotl<uint32>(lookupTable_multiply[d], 24);
|
||||||
}
|
}
|
||||||
|
|
||||||
// The SubBytes Function Substitutes the values in the
|
// The SubBytes Function Substitutes the values in the
|
||||||
|
@ -837,7 +837,7 @@ void AES128_init()
|
||||||
}
|
}
|
||||||
// check if AES-NI is available
|
// check if AES-NI is available
|
||||||
int v[4];
|
int v[4];
|
||||||
__cpuid(v, 1);
|
cpuid(v, 1);
|
||||||
useAESNI = (v[2] & 0x2000000) != 0;
|
useAESNI = (v[2] & 0x2000000) != 0;
|
||||||
if (useAESNI)
|
if (useAESNI)
|
||||||
{
|
{
|
||||||
|
|
Loading…
Reference in New Issue