2021-05-20 01:58:32 +00:00
|
|
|
// Copyright 2021 yuzu Emulator Project
|
|
|
|
// Licensed under GPLv2 or any later version
|
|
|
|
// Refer to the license.txt file included.
|
|
|
|
|
|
|
|
#include "shader_recompiler/backend/bindings.h"
|
|
|
|
#include "shader_recompiler/backend/glsl/emit_context.h"
|
|
|
|
#include "shader_recompiler/frontend/ir/program.h"
|
2021-05-25 23:55:40 +00:00
|
|
|
#include "shader_recompiler/profile.h"
|
2021-05-20 01:58:32 +00:00
|
|
|
|
|
|
|
namespace Shader::Backend::GLSL {
|
2021-05-27 01:18:17 +00:00
|
|
|
namespace {
|
2021-06-03 23:15:36 +00:00
|
|
|
u32 CbufIndex(u32 offset) {
|
|
|
|
return (offset / 4) % 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
char OffsetSwizzle(u32 offset) {
|
|
|
|
return "xyzw"[CbufIndex(offset)];
|
|
|
|
}
|
|
|
|
|
2021-05-27 01:18:17 +00:00
|
|
|
std::string_view InterpDecorator(Interpolation interp) {
|
|
|
|
switch (interp) {
|
|
|
|
case Interpolation::Smooth:
|
|
|
|
return "";
|
|
|
|
case Interpolation::Flat:
|
|
|
|
return "flat";
|
|
|
|
case Interpolation::NoPerspective:
|
|
|
|
return "noperspective";
|
|
|
|
}
|
|
|
|
throw InvalidArgument("Invalid interpolation {}", interp);
|
|
|
|
}
|
2021-05-28 02:28:33 +00:00
|
|
|
|
2021-06-01 03:07:13 +00:00
|
|
|
std::string_view InputArrayDecorator(Stage stage) {
|
2021-05-31 17:28:53 +00:00
|
|
|
switch (stage) {
|
|
|
|
case Stage::Geometry:
|
2021-06-01 03:07:13 +00:00
|
|
|
case Stage::TessellationControl:
|
|
|
|
case Stage::TessellationEval:
|
|
|
|
return "[]";
|
|
|
|
default:
|
|
|
|
return "";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-01 05:49:24 +00:00
|
|
|
bool StoresPerVertexAttributes(Stage stage) {
|
|
|
|
switch (stage) {
|
|
|
|
case Stage::VertexA:
|
|
|
|
case Stage::VertexB:
|
|
|
|
case Stage::Geometry:
|
|
|
|
case Stage::TessellationEval:
|
|
|
|
return true;
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-01 03:07:13 +00:00
|
|
|
std::string OutputDecorator(Stage stage, u32 size) {
|
|
|
|
switch (stage) {
|
|
|
|
case Stage::TessellationControl:
|
|
|
|
return fmt::format("[{}]", size);
|
2021-05-31 17:28:53 +00:00
|
|
|
default:
|
|
|
|
return "";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-05-29 05:53:32 +00:00
|
|
|
std::string_view SamplerType(TextureType type, bool is_depth) {
|
|
|
|
if (is_depth) {
|
|
|
|
switch (type) {
|
|
|
|
case TextureType::Color1D:
|
|
|
|
return "sampler1DShadow";
|
|
|
|
case TextureType::ColorArray1D:
|
|
|
|
return "sampler1DArrayShadow";
|
|
|
|
case TextureType::Color2D:
|
|
|
|
return "sampler2DShadow";
|
|
|
|
case TextureType::ColorArray2D:
|
|
|
|
return "sampler2DArrayShadow";
|
|
|
|
case TextureType::ColorCube:
|
|
|
|
return "samplerCubeShadow";
|
|
|
|
case TextureType::ColorArrayCube:
|
|
|
|
return "samplerCubeArrayShadow";
|
|
|
|
default:
|
|
|
|
fmt::print("Texture type: {}", type);
|
|
|
|
throw NotImplementedException("Texture type: {}", type);
|
|
|
|
}
|
|
|
|
}
|
2021-05-28 02:28:33 +00:00
|
|
|
switch (type) {
|
2021-05-29 05:06:29 +00:00
|
|
|
case TextureType::Color1D:
|
|
|
|
return "sampler1D";
|
|
|
|
case TextureType::ColorArray1D:
|
|
|
|
return "sampler1DArray";
|
2021-05-28 02:28:33 +00:00
|
|
|
case TextureType::Color2D:
|
|
|
|
return "sampler2D";
|
|
|
|
case TextureType::ColorArray2D:
|
|
|
|
return "sampler2DArray";
|
|
|
|
case TextureType::Color3D:
|
|
|
|
return "sampler3D";
|
2021-05-28 17:54:09 +00:00
|
|
|
case TextureType::ColorCube:
|
|
|
|
return "samplerCube";
|
2021-05-29 05:06:29 +00:00
|
|
|
case TextureType::ColorArrayCube:
|
|
|
|
return "samplerCubeArray";
|
|
|
|
case TextureType::Buffer:
|
|
|
|
return "samplerBuffer";
|
2021-05-28 02:28:33 +00:00
|
|
|
default:
|
|
|
|
throw NotImplementedException("Texture type: {}", type);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-03 00:37:24 +00:00
|
|
|
std::string_view ImageType(TextureType type) {
|
|
|
|
switch (type) {
|
|
|
|
case TextureType::Color2D:
|
|
|
|
return "uimage2D";
|
|
|
|
default:
|
|
|
|
throw NotImplementedException("Image type: {}", type);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string_view ImageFormatString(ImageFormat format) {
|
|
|
|
switch (format) {
|
|
|
|
case ImageFormat::Typeless:
|
|
|
|
return "";
|
|
|
|
case ImageFormat::R8_UINT:
|
|
|
|
return ",r8ui";
|
|
|
|
case ImageFormat::R8_SINT:
|
|
|
|
return ",r8i";
|
|
|
|
case ImageFormat::R16_UINT:
|
|
|
|
return ",r16ui";
|
|
|
|
case ImageFormat::R16_SINT:
|
|
|
|
return ",r16i";
|
|
|
|
case ImageFormat::R32_UINT:
|
|
|
|
return ",r32ui";
|
|
|
|
case ImageFormat::R32G32_UINT:
|
|
|
|
return ",rg32ui";
|
|
|
|
case ImageFormat::R32G32B32A32_UINT:
|
|
|
|
return ",rgba32ui";
|
|
|
|
default:
|
|
|
|
throw NotImplementedException("Image format: {}", format);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-01 03:07:13 +00:00
|
|
|
std::string_view GetTessMode(TessPrimitive primitive) {
|
|
|
|
switch (primitive) {
|
|
|
|
case TessPrimitive::Triangles:
|
|
|
|
return "triangles";
|
|
|
|
case TessPrimitive::Quads:
|
|
|
|
return "quads";
|
|
|
|
case TessPrimitive::Isolines:
|
|
|
|
return "isolines";
|
|
|
|
}
|
|
|
|
throw InvalidArgument("Invalid tessellation primitive {}", primitive);
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string_view GetTessSpacing(TessSpacing spacing) {
|
|
|
|
switch (spacing) {
|
|
|
|
case TessSpacing::Equal:
|
|
|
|
return "equal_spacing";
|
|
|
|
case TessSpacing::FractionalOdd:
|
|
|
|
return "fractional_odd_spacing";
|
|
|
|
case TessSpacing::FractionalEven:
|
|
|
|
return "fractional_even_spacing";
|
|
|
|
}
|
|
|
|
throw InvalidArgument("Invalid tessellation spacing {}", spacing);
|
|
|
|
}
|
|
|
|
|
2021-05-31 17:28:53 +00:00
|
|
|
std::string_view InputPrimitive(InputTopology topology) {
|
|
|
|
switch (topology) {
|
|
|
|
case InputTopology::Points:
|
|
|
|
return "points";
|
|
|
|
case InputTopology::Lines:
|
|
|
|
return "lines";
|
|
|
|
case InputTopology::LinesAdjacency:
|
|
|
|
return "lines_adjacency";
|
|
|
|
case InputTopology::Triangles:
|
|
|
|
return "triangles";
|
|
|
|
case InputTopology::TrianglesAdjacency:
|
|
|
|
return "triangles_adjacency";
|
|
|
|
}
|
|
|
|
throw InvalidArgument("Invalid input topology {}", topology);
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string_view OutputPrimitive(OutputTopology topology) {
|
|
|
|
switch (topology) {
|
|
|
|
case OutputTopology::PointList:
|
|
|
|
return "points";
|
|
|
|
case OutputTopology::LineStrip:
|
|
|
|
return "line_strip";
|
|
|
|
case OutputTopology::TriangleStrip:
|
|
|
|
return "triangle_strip";
|
|
|
|
}
|
|
|
|
throw InvalidArgument("Invalid output topology {}", topology);
|
|
|
|
}
|
2021-06-01 03:07:13 +00:00
|
|
|
|
2021-06-02 04:48:49 +00:00
|
|
|
void SetupOutPerVertex(EmitContext& ctx, std::string& header) {
|
|
|
|
if (!StoresPerVertexAttributes(ctx.stage)) {
|
2021-06-01 03:07:13 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
header += "out gl_PerVertex{";
|
2021-06-02 04:33:03 +00:00
|
|
|
header += "vec4 gl_Position;";
|
2021-06-02 04:48:49 +00:00
|
|
|
if (ctx.info.stores_point_size) {
|
2021-06-01 03:07:13 +00:00
|
|
|
header += "float gl_PointSize;";
|
|
|
|
}
|
2021-06-02 04:48:49 +00:00
|
|
|
if (ctx.info.stores_clip_distance) {
|
2021-06-01 03:07:13 +00:00
|
|
|
header += "float gl_ClipDistance[];";
|
|
|
|
}
|
2021-06-02 04:48:49 +00:00
|
|
|
if (ctx.info.stores_viewport_index && ctx.supports_viewport_layer &&
|
|
|
|
ctx.stage != Stage::Geometry) {
|
2021-06-01 05:49:24 +00:00
|
|
|
header += "int gl_ViewportIndex;";
|
|
|
|
}
|
2021-06-01 04:07:14 +00:00
|
|
|
header += "};\n";
|
2021-06-02 04:48:49 +00:00
|
|
|
if (ctx.info.stores_viewport_index && ctx.stage == Stage::Geometry) {
|
2021-06-01 05:04:32 +00:00
|
|
|
header += "out int gl_ViewportIndex;";
|
|
|
|
}
|
2021-06-01 03:07:13 +00:00
|
|
|
}
|
2021-05-27 01:18:17 +00:00
|
|
|
} // namespace
|
2021-05-20 01:58:32 +00:00
|
|
|
|
2021-05-28 00:31:03 +00:00
|
|
|
EmitContext::EmitContext(IR::Program& program, Bindings& bindings, const Profile& profile_,
|
|
|
|
const RuntimeInfo& runtime_info_)
|
|
|
|
: info{program.info}, profile{profile_}, runtime_info{runtime_info_} {
|
2021-06-02 04:48:49 +00:00
|
|
|
supports_viewport_layer = profile.support_gl_vertex_viewport_layer;
|
2021-05-22 00:56:46 +00:00
|
|
|
SetupExtensions(header);
|
2021-05-26 04:16:20 +00:00
|
|
|
stage = program.stage;
|
|
|
|
switch (program.stage) {
|
|
|
|
case Stage::VertexA:
|
|
|
|
case Stage::VertexB:
|
2021-05-28 02:28:33 +00:00
|
|
|
stage_name = "vs";
|
2021-05-26 04:16:20 +00:00
|
|
|
break;
|
|
|
|
case Stage::TessellationControl:
|
2021-06-01 03:07:13 +00:00
|
|
|
stage_name = "tsc";
|
|
|
|
header += fmt::format("layout(vertices={})out;\n", program.invocations);
|
|
|
|
break;
|
2021-05-26 04:16:20 +00:00
|
|
|
case Stage::TessellationEval:
|
2021-06-01 03:07:13 +00:00
|
|
|
stage_name = "tse";
|
|
|
|
header += fmt::format("layout({},{},{})in;\n", GetTessMode(runtime_info.tess_primitive),
|
|
|
|
GetTessSpacing(runtime_info.tess_spacing),
|
|
|
|
runtime_info.tess_clockwise ? "cw" : "ccw");
|
2021-05-26 04:16:20 +00:00
|
|
|
break;
|
|
|
|
case Stage::Geometry:
|
2021-05-28 02:28:33 +00:00
|
|
|
stage_name = "gs";
|
2021-06-01 03:07:13 +00:00
|
|
|
header += fmt::format("layout({})in;layout({},max_vertices={})out;\n",
|
2021-05-31 17:28:53 +00:00
|
|
|
InputPrimitive(runtime_info.input_topology),
|
|
|
|
OutputPrimitive(program.output_topology), program.output_vertices);
|
2021-05-26 04:16:20 +00:00
|
|
|
break;
|
|
|
|
case Stage::Fragment:
|
2021-05-28 02:28:33 +00:00
|
|
|
stage_name = "fs";
|
2021-05-26 04:16:20 +00:00
|
|
|
break;
|
|
|
|
case Stage::Compute:
|
2021-05-28 02:28:33 +00:00
|
|
|
stage_name = "cs";
|
2021-05-21 03:38:38 +00:00
|
|
|
header += fmt::format("layout(local_size_x={},local_size_y={},local_size_z={}) in;\n",
|
|
|
|
program.workgroup_size[0], program.workgroup_size[1],
|
|
|
|
program.workgroup_size[2]);
|
2021-05-26 04:16:20 +00:00
|
|
|
break;
|
2021-05-21 03:38:38 +00:00
|
|
|
}
|
2021-06-02 04:48:49 +00:00
|
|
|
SetupOutPerVertex(*this, header);
|
2021-05-26 04:16:20 +00:00
|
|
|
for (size_t index = 0; index < info.input_generics.size(); ++index) {
|
|
|
|
const auto& generic{info.input_generics[index]};
|
|
|
|
if (generic.used) {
|
2021-06-01 03:07:13 +00:00
|
|
|
header += fmt::format("layout(location={}){} in vec4 in_attr{}{};", index,
|
|
|
|
InterpDecorator(generic.interpolation), index,
|
|
|
|
InputArrayDecorator(stage));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
for (size_t index = 0; index < info.uses_patches.size(); ++index) {
|
|
|
|
if (!info.uses_patches[index]) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (stage == Stage::TessellationControl) {
|
|
|
|
header += fmt::format("layout(location={})patch out vec4 patch{};", index, index);
|
|
|
|
} else {
|
|
|
|
header += fmt::format("layout(location={})patch in vec4 patch{};", index, index);
|
2021-05-26 04:16:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
for (size_t index = 0; index < info.stores_frag_color.size(); ++index) {
|
|
|
|
if (!info.stores_frag_color[index]) {
|
|
|
|
continue;
|
|
|
|
}
|
2021-05-28 17:54:09 +00:00
|
|
|
header += fmt::format("layout(location={})out vec4 frag_color{};", index, index);
|
2021-05-26 04:16:20 +00:00
|
|
|
}
|
|
|
|
for (size_t index = 0; index < info.stores_generics.size(); ++index) {
|
2021-05-31 02:42:52 +00:00
|
|
|
// TODO: Properly resolve attribute issues
|
|
|
|
if (info.stores_generics[index] || stage == Stage::VertexA || stage == Stage::VertexB) {
|
2021-06-02 04:33:03 +00:00
|
|
|
DefineGenericOutput(index, program.invocations);
|
2021-05-26 04:16:20 +00:00
|
|
|
}
|
|
|
|
}
|
2021-06-01 04:07:14 +00:00
|
|
|
header += "\n";
|
2021-05-28 02:28:33 +00:00
|
|
|
DefineConstantBuffers(bindings);
|
|
|
|
DefineStorageBuffers(bindings);
|
2021-05-27 01:18:17 +00:00
|
|
|
SetupImages(bindings);
|
2021-05-28 02:28:33 +00:00
|
|
|
DefineHelperFunctions();
|
2021-05-20 01:58:32 +00:00
|
|
|
}
|
|
|
|
|
2021-05-28 17:54:09 +00:00
|
|
|
void EmitContext::SetupExtensions(std::string&) {
|
2021-05-30 23:13:22 +00:00
|
|
|
// TODO: track this usage
|
|
|
|
header += "#extension GL_ARB_sparse_texture2 : enable\n";
|
|
|
|
header += "#extension GL_EXT_texture_shadow_lod : enable\n";
|
2021-06-03 00:37:24 +00:00
|
|
|
header += "#extension GL_EXT_shader_image_load_formatted : enable\n";
|
2021-05-22 00:56:46 +00:00
|
|
|
if (info.uses_int64) {
|
|
|
|
header += "#extension GL_ARB_gpu_shader_int64 : enable\n";
|
|
|
|
}
|
2021-05-24 22:35:37 +00:00
|
|
|
if (info.uses_int64_bit_atomics) {
|
|
|
|
header += "#extension GL_NV_shader_atomic_int64 : enable\n";
|
|
|
|
}
|
|
|
|
if (info.uses_atomic_f32_add) {
|
|
|
|
header += "#extension GL_NV_shader_atomic_float : enable\n";
|
|
|
|
}
|
|
|
|
if (info.uses_atomic_f16x2_add || info.uses_atomic_f16x2_min || info.uses_atomic_f16x2_max) {
|
|
|
|
header += "#extension NV_shader_atomic_fp16_vector : enable\n";
|
|
|
|
}
|
2021-05-25 05:52:02 +00:00
|
|
|
if (info.uses_fp16) {
|
2021-05-25 23:55:40 +00:00
|
|
|
if (profile.support_gl_nv_gpu_shader_5) {
|
|
|
|
header += "#extension GL_NV_gpu_shader5 : enable\n";
|
|
|
|
}
|
|
|
|
if (profile.support_gl_amd_gpu_shader_half_float) {
|
|
|
|
header += "#extension GL_AMD_gpu_shader_half_float : enable\n";
|
|
|
|
}
|
2021-05-25 05:52:02 +00:00
|
|
|
}
|
2021-05-29 01:24:52 +00:00
|
|
|
if (info.uses_subgroup_invocation_id || info.uses_subgroup_mask || info.uses_subgroup_vote ||
|
|
|
|
info.uses_subgroup_shuffles || info.uses_fswzadd) {
|
|
|
|
header += "#extension GL_ARB_shader_ballot : enable\n";
|
2021-05-30 04:08:39 +00:00
|
|
|
header += "#extension GL_ARB_shader_group_vote : enable\n";
|
2021-05-30 04:53:26 +00:00
|
|
|
if (!info.uses_int64) {
|
|
|
|
header += "#extension GL_ARB_gpu_shader_int64 : enable\n";
|
|
|
|
}
|
2021-05-29 01:24:52 +00:00
|
|
|
}
|
2021-06-02 04:48:49 +00:00
|
|
|
if (info.stores_viewport_index && supports_viewport_layer && stage != Stage::Geometry) {
|
2021-05-31 17:28:53 +00:00
|
|
|
header += "#extension GL_ARB_shader_viewport_layer_array : enable\n";
|
|
|
|
}
|
2021-05-22 00:56:46 +00:00
|
|
|
}
|
|
|
|
|
2021-05-28 02:28:33 +00:00
|
|
|
void EmitContext::DefineConstantBuffers(Bindings& bindings) {
|
2021-05-20 01:58:32 +00:00
|
|
|
if (info.constant_buffer_descriptors.empty()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
for (const auto& desc : info.constant_buffer_descriptors) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += fmt::format(
|
|
|
|
"layout(std140,binding={}) uniform {}_cbuf_{}{{vec4 {}_cbuf{}[{}];}};",
|
2021-05-28 02:28:33 +00:00
|
|
|
bindings.uniform_buffer, stage_name, desc.index, stage_name, desc.index, 4 * 1024);
|
|
|
|
bindings.uniform_buffer += desc.count;
|
2021-05-21 03:38:38 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-05-28 02:28:33 +00:00
|
|
|
void EmitContext::DefineStorageBuffers(Bindings& bindings) {
|
2021-05-21 03:38:38 +00:00
|
|
|
if (info.storage_buffers_descriptors.empty()) {
|
|
|
|
return;
|
|
|
|
}
|
2021-05-31 00:02:44 +00:00
|
|
|
u32 index{};
|
2021-05-21 03:38:38 +00:00
|
|
|
for (const auto& desc : info.storage_buffers_descriptors) {
|
2021-05-31 00:02:44 +00:00
|
|
|
header += fmt::format("layout(std430,binding={}) buffer {}_ssbo_{}{{uint {}_ssbo{}[];}};",
|
|
|
|
bindings.storage_buffer, stage_name, bindings.storage_buffer,
|
|
|
|
stage_name, index);
|
2021-05-28 02:28:33 +00:00
|
|
|
bindings.storage_buffer += desc.count;
|
2021-05-31 00:02:44 +00:00
|
|
|
index += desc.count;
|
2021-05-20 01:58:32 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-02 04:33:03 +00:00
|
|
|
void EmitContext::DefineGenericOutput(size_t index, u32 invocations) {
|
|
|
|
static constexpr std::string_view swizzle{"xyzw"};
|
|
|
|
const size_t base_index{static_cast<size_t>(IR::Attribute::Generic0X) + index * 4};
|
|
|
|
u32 element{0};
|
|
|
|
while (element < 4) {
|
|
|
|
std::string definition{fmt::format("layout(location={}", index)};
|
|
|
|
const u32 remainder{4 - element};
|
|
|
|
const TransformFeedbackVarying* xfb_varying{};
|
|
|
|
if (!runtime_info.xfb_varyings.empty()) {
|
|
|
|
xfb_varying = &runtime_info.xfb_varyings[base_index + element];
|
|
|
|
xfb_varying = xfb_varying && xfb_varying->components > 0 ? xfb_varying : nullptr;
|
|
|
|
}
|
|
|
|
const u32 num_components{xfb_varying ? xfb_varying->components : remainder};
|
|
|
|
if (element > 0) {
|
|
|
|
definition += fmt::format(",component={}", element);
|
|
|
|
}
|
|
|
|
if (xfb_varying) {
|
|
|
|
definition +=
|
|
|
|
fmt::format(",xfb_buffer={},xfb_stride={},xfb_offset={}", xfb_varying->buffer,
|
|
|
|
xfb_varying->stride, xfb_varying->offset);
|
|
|
|
}
|
|
|
|
std::string name{fmt::format("out_attr{}", index)};
|
|
|
|
if (num_components < 4 || element > 0) {
|
|
|
|
name += fmt::format("_{}", swizzle.substr(element, num_components));
|
|
|
|
}
|
|
|
|
const auto type{num_components == 1 ? "float" : fmt::format("vec{}", num_components)};
|
|
|
|
definition += fmt::format(")out {} {}{};", type, name, OutputDecorator(stage, invocations));
|
|
|
|
header += definition;
|
|
|
|
|
|
|
|
const GenericElementInfo element_info{
|
|
|
|
.name = name,
|
|
|
|
.first_element = element,
|
|
|
|
.num_components = num_components,
|
|
|
|
};
|
|
|
|
std::fill_n(output_generics[index].begin() + element, num_components, element_info);
|
|
|
|
element += num_components;
|
|
|
|
}
|
|
|
|
header += "\n";
|
|
|
|
}
|
|
|
|
|
2021-05-24 22:35:37 +00:00
|
|
|
void EmitContext::DefineHelperFunctions() {
|
2021-06-03 23:15:36 +00:00
|
|
|
header += "\n#define ftoi floatBitsToInt\n#define ftou floatBitsToUint\n"
|
|
|
|
"#define itof intBitsToFloat\n#define utof uintBitsToFloat\n";
|
2021-05-30 18:31:59 +00:00
|
|
|
if (info.uses_global_increment || info.uses_shared_increment) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasIncrement(uint op_a,uint op_b){return(op_a>=op_b)?0u:(op_a+1u);}\n";
|
2021-05-24 22:35:37 +00:00
|
|
|
}
|
2021-05-30 18:31:59 +00:00
|
|
|
if (info.uses_global_decrement || info.uses_shared_decrement) {
|
2021-06-02 04:33:03 +00:00
|
|
|
header += "uint CasDecrement(uint op_a,uint "
|
|
|
|
"op_b){return(op_a==0||op_a>op_b)?op_b:(op_a-1u);}\n";
|
2021-05-24 22:35:37 +00:00
|
|
|
}
|
2021-05-25 05:35:30 +00:00
|
|
|
if (info.uses_atomic_f32_add) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatAdd(uint op_a,float op_b){return "
|
2021-06-03 23:15:36 +00:00
|
|
|
"ftou(utof(op_a)+op_b);}\n";
|
2021-05-25 05:35:30 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_f32x2_add) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatAdd32x2(uint op_a,vec2 op_b){return "
|
|
|
|
"packHalf2x16(unpackHalf2x16(op_a)+op_b);}\n";
|
2021-05-25 05:35:30 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_f32x2_min) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatMin32x2(uint op_a,vec2 op_b){return "
|
|
|
|
"packHalf2x16(min(unpackHalf2x16(op_a),op_b));}\n";
|
2021-05-25 05:35:30 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_f32x2_max) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatMax32x2(uint op_a,vec2 op_b){return "
|
|
|
|
"packHalf2x16(max(unpackHalf2x16(op_a),op_b));}\n";
|
2021-05-25 05:35:30 +00:00
|
|
|
}
|
2021-05-25 05:52:02 +00:00
|
|
|
if (info.uses_atomic_f16x2_add) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatAdd16x2(uint op_a,f16vec2 op_b){return "
|
|
|
|
"packFloat2x16(unpackFloat2x16(op_a)+op_b);}\n";
|
2021-05-25 05:52:02 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_f16x2_min) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatMin16x2(uint op_a,f16vec2 op_b){return "
|
|
|
|
"packFloat2x16(min(unpackFloat2x16(op_a),op_b));}\n";
|
2021-05-25 05:52:02 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_f16x2_max) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasFloatMax16x2(uint op_a,f16vec2 op_b){return "
|
|
|
|
"packFloat2x16(max(unpackFloat2x16(op_a),op_b));}\n";
|
2021-05-25 05:52:02 +00:00
|
|
|
}
|
2021-05-26 02:13:50 +00:00
|
|
|
if (info.uses_atomic_s32_min) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasMinS32(uint op_a,uint op_b){return uint(min(int(op_a),int(op_b)));}";
|
2021-05-26 02:13:50 +00:00
|
|
|
}
|
|
|
|
if (info.uses_atomic_s32_max) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += "uint CasMaxS32(uint op_a,uint op_b){return uint(max(int(op_a),int(op_b)));}";
|
2021-05-26 02:13:50 +00:00
|
|
|
}
|
2021-06-03 23:15:36 +00:00
|
|
|
if (info.uses_global_memory) {
|
|
|
|
std::string write_func{"void WriteGlobal32(uint64_t addr,uint data){\n"};
|
|
|
|
std::string write_func_64{"void WriteGlobal64(uint64_t addr,uvec2 data){\n"};
|
|
|
|
std::string write_func_128{"void WriteGlobal128(uint64_t addr,uvec4 data){\n"};
|
|
|
|
|
|
|
|
std::string load_func{"uint LoadGlobal32(uint64_t addr){\n"};
|
|
|
|
std::string load_func_64{"uvec2 LoadGlobal64(uint64_t addr){\n"};
|
|
|
|
std::string load_func_128{"uvec4 LoadGlobal128(uint64_t addr){\n"};
|
|
|
|
const size_t num_buffers{info.storage_buffers_descriptors.size()};
|
|
|
|
for (size_t index = 0; index < num_buffers; ++index) {
|
|
|
|
if (!info.nvn_buffer_used[index]) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
const auto& ssbo{info.storage_buffers_descriptors[index]};
|
|
|
|
const u32 size_cbuf_offset{ssbo.cbuf_offset + 8};
|
|
|
|
const auto ssbo_addr{fmt::format("ssbo_addr{}", index)};
|
|
|
|
const auto cbuf{fmt::format("{}_cbuf{}", stage_name, ssbo.cbuf_index)};
|
|
|
|
const auto cbuf_value{fmt::format(
|
|
|
|
"uint64_t {}=packUint2x32(uvec2(ftou({}[{}].{}),ftou({}[{}].{})));", ssbo_addr,
|
|
|
|
cbuf, ssbo.cbuf_offset / 16, OffsetSwizzle(ssbo.cbuf_offset), cbuf,
|
|
|
|
(ssbo.cbuf_offset + 4) / 16, OffsetSwizzle(ssbo.cbuf_offset + 4))};
|
|
|
|
|
|
|
|
write_func += cbuf_value;
|
|
|
|
write_func_64 += cbuf_value;
|
|
|
|
write_func_128 += cbuf_value;
|
|
|
|
load_func += cbuf_value;
|
|
|
|
load_func_64 += cbuf_value;
|
|
|
|
load_func_128 += cbuf_value;
|
|
|
|
const auto ssbo_size{fmt::format("ftou({}[{}].{}),ftou({}[{}].{})", cbuf,
|
|
|
|
size_cbuf_offset / 16, OffsetSwizzle(size_cbuf_offset),
|
|
|
|
cbuf, (size_cbuf_offset + 4) / 16,
|
|
|
|
OffsetSwizzle(size_cbuf_offset + 4))};
|
|
|
|
const auto comparison{fmt::format("if((addr>={})&&(addr<({}+\nuint64_t(uvec2({}))))){{",
|
|
|
|
ssbo_addr, ssbo_addr, ssbo_size)};
|
|
|
|
write_func += comparison;
|
|
|
|
write_func_64 += comparison;
|
|
|
|
write_func_128 += comparison;
|
|
|
|
load_func += comparison;
|
|
|
|
load_func_64 += comparison;
|
|
|
|
load_func_128 += comparison;
|
|
|
|
|
|
|
|
const auto ssbo_name{fmt::format("{}_ssbo{}", stage_name, index)};
|
|
|
|
write_func += fmt::format("{}[uint(addr-{})>>2]=data;return;}}", ssbo_name, ssbo_addr);
|
|
|
|
write_func_64 +=
|
|
|
|
fmt::format("{}[uint(addr-{})>>2]=data.x;{}[uint(addr-{}+4)>>2]=data.y;return;}}",
|
|
|
|
ssbo_name, ssbo_addr, ssbo_name, ssbo_addr);
|
|
|
|
write_func_128 +=
|
|
|
|
fmt::format("{}[uint(addr-{})>>2]=data.x;{}[uint(addr-{}+4)>>2]=data.y;{}[uint("
|
|
|
|
"addr-{}+8)>>2]=data.z;{}[uint(addr-{}+12)>>2]=data.w;return;}}",
|
|
|
|
ssbo_name, ssbo_addr, ssbo_name, ssbo_addr, ssbo_name, ssbo_addr,
|
|
|
|
ssbo_name, ssbo_addr);
|
|
|
|
load_func += fmt::format("return {}[uint(addr-{})>>2];}}", ssbo_name, ssbo_addr);
|
|
|
|
load_func_64 +=
|
|
|
|
fmt::format("return uvec2({}[uint(addr-{})>>2],{}[uint(addr-{}+4)>>2]);}}",
|
|
|
|
ssbo_name, ssbo_addr, ssbo_name, ssbo_addr);
|
|
|
|
load_func_128 += fmt::format("return "
|
|
|
|
"uvec4({}[uint(addr-{})>>2],{}[uint(addr-{}+4)>>2],{}["
|
|
|
|
"uint(addr-{}+8)>>2],{}[uint(addr-{}+12)>>2]);}}",
|
|
|
|
ssbo_name, ssbo_addr, ssbo_name, ssbo_addr, ssbo_name,
|
|
|
|
ssbo_addr, ssbo_name, ssbo_addr);
|
|
|
|
}
|
|
|
|
write_func += "}\n";
|
|
|
|
write_func_64 += "}\n";
|
|
|
|
write_func_128 += "}\n";
|
|
|
|
load_func += "return 0u;}\n";
|
|
|
|
load_func_64 += "return uvec2(0);}\n";
|
|
|
|
load_func_128 += "return uvec4(0);}\n";
|
|
|
|
header += write_func;
|
|
|
|
header += write_func_64;
|
|
|
|
header += write_func_128;
|
|
|
|
header += load_func;
|
|
|
|
header += load_func_64;
|
|
|
|
header += load_func_128;
|
|
|
|
}
|
2021-05-24 22:35:37 +00:00
|
|
|
}
|
|
|
|
|
2021-05-27 01:18:17 +00:00
|
|
|
void EmitContext::SetupImages(Bindings& bindings) {
|
|
|
|
image_buffer_bindings.reserve(info.image_buffer_descriptors.size());
|
|
|
|
for (const auto& desc : info.image_buffer_descriptors) {
|
2021-06-03 00:37:24 +00:00
|
|
|
const auto indices{bindings.image + desc.count};
|
|
|
|
for (u32 index = bindings.image; index < indices; ++index) {
|
|
|
|
header += fmt::format("layout(binding={}) uniform uimageBuffer img{};", bindings.image,
|
|
|
|
index);
|
|
|
|
}
|
2021-05-27 01:18:17 +00:00
|
|
|
image_buffer_bindings.push_back(bindings.image);
|
|
|
|
bindings.image += desc.count;
|
|
|
|
}
|
|
|
|
image_bindings.reserve(info.image_descriptors.size());
|
|
|
|
for (const auto& desc : info.image_descriptors) {
|
|
|
|
image_bindings.push_back(bindings.image);
|
2021-06-03 00:37:24 +00:00
|
|
|
const auto format{ImageFormatString(desc.format)};
|
|
|
|
const auto image_type{ImageType(desc.type)};
|
|
|
|
const auto qualifier{desc.is_written ? "" : "readonly "};
|
|
|
|
const auto indices{bindings.image + desc.count};
|
|
|
|
for (u32 index = bindings.image; index < indices; ++index) {
|
|
|
|
header += fmt::format("layout(binding={}{})uniform {}{} img{};", bindings.image, format,
|
|
|
|
qualifier, image_type, index);
|
|
|
|
}
|
2021-05-27 01:18:17 +00:00
|
|
|
bindings.image += desc.count;
|
|
|
|
}
|
|
|
|
texture_buffer_bindings.reserve(info.texture_buffer_descriptors.size());
|
|
|
|
for (const auto& desc : info.texture_buffer_descriptors) {
|
|
|
|
texture_buffer_bindings.push_back(bindings.texture);
|
2021-05-31 05:12:52 +00:00
|
|
|
const auto sampler_type{SamplerType(TextureType::Buffer, false)};
|
|
|
|
const auto indices{bindings.texture + desc.count};
|
|
|
|
for (u32 index = bindings.texture; index < indices; ++index) {
|
|
|
|
header += fmt::format("layout(binding={}) uniform {} tex{};", bindings.texture,
|
|
|
|
sampler_type, index);
|
|
|
|
}
|
2021-05-27 01:18:17 +00:00
|
|
|
bindings.texture += desc.count;
|
|
|
|
}
|
|
|
|
texture_bindings.reserve(info.texture_descriptors.size());
|
|
|
|
for (const auto& desc : info.texture_descriptors) {
|
2021-05-29 05:53:32 +00:00
|
|
|
const auto sampler_type{SamplerType(desc.type, desc.is_depth)};
|
2021-05-27 01:18:17 +00:00
|
|
|
texture_bindings.push_back(bindings.texture);
|
|
|
|
const auto indices{bindings.texture + desc.count};
|
|
|
|
for (u32 index = bindings.texture; index < indices; ++index) {
|
2021-05-28 17:54:09 +00:00
|
|
|
header += fmt::format("layout(binding={}) uniform {} tex{};", bindings.texture,
|
|
|
|
sampler_type, index);
|
2021-05-27 01:18:17 +00:00
|
|
|
}
|
|
|
|
bindings.texture += desc.count;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-05-20 01:58:32 +00:00
|
|
|
} // namespace Shader::Backend::GLSL
|