mirror of
https://git.suyu.dev/suyu/suyu
synced 2024-11-01 04:47:53 +00:00
4e35177e23
Implement VOTE using Nvidia's intrinsics. Documentation about these can be found here https://developer.nvidia.com/reading-between-threads-shader-intrinsics Instead of using portable ARB instructions I opted to use Nvidia intrinsics because these are the closest we have to how Tegra X1 hardware renders. To stub VOTE on non-Nvidia drivers (including nouveau) this commit simulates a GPU with a warp size of one, returning what is meaningful for the instruction being emulated: * anyThreadNV(value) -> value * allThreadsNV(value) -> value * allThreadsEqualNV(value) -> true ballotARB, also known as "uint64_t(activeThreadsNV())", emits VOTE.ANY Rd, PT, PT; on nouveau's compiler. This doesn't match exactly to Nvidia's code VOTE.ALL Rd, PT, PT; Which is emulated with activeThreadsNV() by this commit. In theory this shouldn't really matter since .ANY, .ALL and .EQ affect the predicates (set to PT on those cases) and not the registers.
102 lines
4.3 KiB
CMake
102 lines
4.3 KiB
CMake
# Gets a UTC timstamp and sets the provided variable to it
|
|
function(get_timestamp _var)
|
|
string(TIMESTAMP timestamp UTC)
|
|
set(${_var} "${timestamp}" PARENT_SCOPE)
|
|
endfunction()
|
|
|
|
list(APPEND CMAKE_MODULE_PATH "${SRC_DIR}/externals/cmake-modules")
|
|
# generate git/build information
|
|
include(GetGitRevisionDescription)
|
|
get_git_head_revision(GIT_REF_SPEC GIT_REV)
|
|
git_describe(GIT_DESC --always --long --dirty)
|
|
git_branch_name(GIT_BRANCH)
|
|
get_timestamp(BUILD_DATE)
|
|
|
|
# Generate cpp with Git revision from template
|
|
# Also if this is a CI build, add the build name (ie: Nightly, Canary) to the scm_rev file as well
|
|
set(REPO_NAME "")
|
|
set(BUILD_VERSION "0")
|
|
if (BUILD_REPOSITORY)
|
|
# regex capture the string nightly or canary into CMAKE_MATCH_1
|
|
string(REGEX MATCH "yuzu-emu/yuzu-?(.*)" OUTVAR ${BUILD_REPOSITORY})
|
|
if ("${CMAKE_MATCH_COUNT}" GREATER 0)
|
|
# capitalize the first letter of each word in the repo name.
|
|
string(REPLACE "-" ";" REPO_NAME_LIST ${CMAKE_MATCH_1})
|
|
foreach(WORD ${REPO_NAME_LIST})
|
|
string(SUBSTRING ${WORD} 0 1 FIRST_LETTER)
|
|
string(SUBSTRING ${WORD} 1 -1 REMAINDER)
|
|
string(TOUPPER ${FIRST_LETTER} FIRST_LETTER)
|
|
set(REPO_NAME "${REPO_NAME}${FIRST_LETTER}${REMAINDER}")
|
|
endforeach()
|
|
if (BUILD_TAG)
|
|
string(REGEX MATCH "${CMAKE_MATCH_1}-([0-9]+)" OUTVAR ${BUILD_TAG})
|
|
if (${CMAKE_MATCH_COUNT} GREATER 0)
|
|
set(BUILD_VERSION ${CMAKE_MATCH_1})
|
|
endif()
|
|
if (BUILD_VERSION)
|
|
# This leaves a trailing space on the last word, but we actually want that
|
|
# because of how it's styled in the title bar.
|
|
set(BUILD_FULLNAME "${REPO_NAME} ${BUILD_VERSION} ")
|
|
else()
|
|
set(BUILD_FULLNAME "")
|
|
endif()
|
|
endif()
|
|
endif()
|
|
endif()
|
|
|
|
# The variable SRC_DIR must be passed into the script (since it uses the current build directory for all values of CMAKE_*_DIR)
|
|
set(VIDEO_CORE "${SRC_DIR}/src/video_core")
|
|
set(HASH_FILES
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_cache.cpp"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_cache.h"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_decompiler.cpp"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_decompiler.h"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_disk_cache.cpp"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_disk_cache.h"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_gen.cpp"
|
|
"${VIDEO_CORE}/renderer_opengl/gl_shader_gen.h"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic.cpp"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic_half.cpp"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic_half_immediate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic_immediate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic_integer.cpp"
|
|
"${VIDEO_CORE}/shader/decode/arithmetic_integer_immediate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/bfe.cpp"
|
|
"${VIDEO_CORE}/shader/decode/bfi.cpp"
|
|
"${VIDEO_CORE}/shader/decode/conversion.cpp"
|
|
"${VIDEO_CORE}/shader/decode/ffma.cpp"
|
|
"${VIDEO_CORE}/shader/decode/float_set.cpp"
|
|
"${VIDEO_CORE}/shader/decode/float_set_predicate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/half_set.cpp"
|
|
"${VIDEO_CORE}/shader/decode/half_set_predicate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/hfma2.cpp"
|
|
"${VIDEO_CORE}/shader/decode/image.cpp"
|
|
"${VIDEO_CORE}/shader/decode/integer_set.cpp"
|
|
"${VIDEO_CORE}/shader/decode/integer_set_predicate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/memory.cpp"
|
|
"${VIDEO_CORE}/shader/decode/texture.cpp"
|
|
"${VIDEO_CORE}/shader/decode/other.cpp"
|
|
"${VIDEO_CORE}/shader/decode/predicate_set_predicate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/predicate_set_register.cpp"
|
|
"${VIDEO_CORE}/shader/decode/register_set_predicate.cpp"
|
|
"${VIDEO_CORE}/shader/decode/shift.cpp"
|
|
"${VIDEO_CORE}/shader/decode/video.cpp"
|
|
"${VIDEO_CORE}/shader/decode/warp.cpp"
|
|
"${VIDEO_CORE}/shader/decode/xmad.cpp"
|
|
"${VIDEO_CORE}/shader/control_flow.cpp"
|
|
"${VIDEO_CORE}/shader/control_flow.h"
|
|
"${VIDEO_CORE}/shader/decode.cpp"
|
|
"${VIDEO_CORE}/shader/node.h"
|
|
"${VIDEO_CORE}/shader/node_helper.cpp"
|
|
"${VIDEO_CORE}/shader/node_helper.h"
|
|
"${VIDEO_CORE}/shader/shader_ir.cpp"
|
|
"${VIDEO_CORE}/shader/shader_ir.h"
|
|
"${VIDEO_CORE}/shader/track.cpp"
|
|
)
|
|
set(COMBINED "")
|
|
foreach (F IN LISTS HASH_FILES)
|
|
file(READ ${F} TMP)
|
|
set(COMBINED "${COMBINED}${TMP}")
|
|
endforeach()
|
|
string(MD5 SHADER_CACHE_VERSION "${COMBINED}")
|
|
configure_file("${SRC_DIR}/src/common/scm_rev.cpp.in" "scm_rev.cpp" @ONLY)
|