mirror of
				https://github.com/dolphin-emu/dolphin.git
				synced 2025-10-25 09:29:43 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			955 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			955 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // Copyright 2011 Dolphin Emulator Project
 | |
| // SPDX-License-Identifier: GPL-2.0-or-later
 | |
| 
 | |
| #include "VideoBackends/OGL/ProgramShaderCache.h"
 | |
| 
 | |
| #include <array>
 | |
| #include <atomic>
 | |
| #include <memory>
 | |
| #include <string>
 | |
| 
 | |
| #include <fmt/format.h>
 | |
| 
 | |
| #include "Common/Align.h"
 | |
| #include "Common/Assert.h"
 | |
| #include "Common/CommonTypes.h"
 | |
| #include "Common/FileUtil.h"
 | |
| #include "Common/GL/GLContext.h"
 | |
| #include "Common/Logging/Log.h"
 | |
| #include "Common/MsgHandler.h"
 | |
| #include "Common/Version.h"
 | |
| 
 | |
| #include "Core/ConfigManager.h"
 | |
| #include "Core/System.h"
 | |
| 
 | |
| #include "VideoBackends/OGL/OGLConfig.h"
 | |
| #include "VideoBackends/OGL/OGLGfx.h"
 | |
| #include "VideoBackends/OGL/OGLShader.h"
 | |
| #include "VideoBackends/OGL/OGLStreamBuffer.h"
 | |
| #include "VideoBackends/OGL/OGLVertexManager.h"
 | |
| 
 | |
| #include "VideoCommon/AsyncShaderCompiler.h"
 | |
| #include "VideoCommon/GeometryShaderManager.h"
 | |
| #include "VideoCommon/PixelShaderManager.h"
 | |
| #include "VideoCommon/Statistics.h"
 | |
| #include "VideoCommon/VertexLoaderManager.h"
 | |
| #include "VideoCommon/VertexShaderManager.h"
 | |
| #include "VideoCommon/VideoBackendBase.h"
 | |
| #include "VideoCommon/VideoConfig.h"
 | |
| 
 | |
| namespace OGL
 | |
| {
 | |
| u32 ProgramShaderCache::s_ubo_buffer_size;
 | |
| s32 ProgramShaderCache::s_ubo_align = 1;
 | |
| GLuint ProgramShaderCache::s_attributeless_VBO = 0;
 | |
| GLuint ProgramShaderCache::s_attributeless_VAO = 0;
 | |
| GLuint ProgramShaderCache::s_last_VAO = 0;
 | |
| 
 | |
| static std::unique_ptr<StreamBuffer> s_buffer;
 | |
| static int num_failures = 0;
 | |
| 
 | |
| static GLuint CurrentProgram = 0;
 | |
| ProgramShaderCache::PipelineProgramMap ProgramShaderCache::s_pipeline_programs;
 | |
| std::mutex ProgramShaderCache::s_pipeline_program_lock;
 | |
| static std::string s_glsl_header;
 | |
| static std::atomic<u64> s_shader_counter{0};
 | |
| static thread_local bool s_is_shared_context = false;
 | |
| 
 | |
| static std::string GetGLSLVersionString()
 | |
| {
 | |
|   GlslVersion v = g_ogl_config.eSupportedGLSLVersion;
 | |
|   switch (v)
 | |
|   {
 | |
|   case GlslEs300:
 | |
|     return "#version 300 es";
 | |
|   case GlslEs310:
 | |
|     return "#version 310 es";
 | |
|   case GlslEs320:
 | |
|     return "#version 320 es";
 | |
|   case Glsl130:
 | |
|     return "#version 130";
 | |
|   case Glsl140:
 | |
|     return "#version 140";
 | |
|   case Glsl150:
 | |
|     return "#version 150";
 | |
|   case Glsl330:
 | |
|     return "#version 330";
 | |
|   case Glsl400:
 | |
|     return "#version 400";
 | |
|   case Glsl430:
 | |
|     return "#version 430";
 | |
|   case Glsl450:
 | |
|     return "#version 450";
 | |
|   default:
 | |
|     // Shouldn't ever hit this
 | |
|     return "#version ERROR";
 | |
|   }
 | |
| }
 | |
| 
 | |
| void SHADER::SetProgramVariables()
 | |
| {
 | |
|   if (g_backend_info.bSupportsBindingLayout)
 | |
|     return;
 | |
| 
 | |
|   // To set uniform blocks/uniforms, the program must be active. We restore the
 | |
|   // current binding at the end of this method to maintain the invariant.
 | |
|   glUseProgram(glprogid);
 | |
| 
 | |
|   // Bind UBO and texture samplers
 | |
|   GLint PSBlock_id = glGetUniformBlockIndex(glprogid, "PSBlock");
 | |
|   GLint VSBlock_id = glGetUniformBlockIndex(glprogid, "VSBlock");
 | |
|   GLint GSBlock_id = glGetUniformBlockIndex(glprogid, "GSBlock");
 | |
|   GLint UBERBlock_id = glGetUniformBlockIndex(glprogid, "UBERBlock");
 | |
|   if (PSBlock_id != -1)
 | |
|     glUniformBlockBinding(glprogid, PSBlock_id, 1);
 | |
|   if (VSBlock_id != -1)
 | |
|     glUniformBlockBinding(glprogid, VSBlock_id, 2);
 | |
|   if (GSBlock_id != -1)
 | |
|     glUniformBlockBinding(glprogid, GSBlock_id, 4);
 | |
|   if (UBERBlock_id != -1)
 | |
|     glUniformBlockBinding(glprogid, UBERBlock_id, 5);
 | |
| 
 | |
|   // Bind Texture Samplers
 | |
|   for (int a = 0; a < 8; ++a)
 | |
|   {
 | |
|     // Still need to get sampler locations since we aren't binding them statically in the shaders
 | |
|     int loc = glGetUniformLocation(glprogid, fmt::format("samp[{}]", a).c_str());
 | |
|     if (loc < 0)
 | |
|       loc = glGetUniformLocation(glprogid, fmt::format("samp{}", a).c_str());
 | |
|     if (loc >= 0)
 | |
|       glUniform1i(loc, a);
 | |
|   }
 | |
| 
 | |
|   // Restore previous program binding.
 | |
|   glUseProgram(CurrentProgram);
 | |
| }
 | |
| 
 | |
| void SHADER::SetProgramBindings(bool is_compute)
 | |
| {
 | |
|   if (g_ogl_config.bSupportsExplicitLayoutInShader)
 | |
|   {
 | |
|     return;
 | |
|   }
 | |
|   if (!is_compute)
 | |
|   {
 | |
|     if (g_backend_info.bSupportsDualSourceBlend)
 | |
|     {
 | |
|       // So we do support extended blending
 | |
|       // So we need to set a few more things here.
 | |
|       // Bind our out locations
 | |
|       glBindFragDataLocationIndexed(glprogid, 0, 0, "ocol0");
 | |
|       glBindFragDataLocationIndexed(glprogid, 0, 1, "ocol1");
 | |
|     }
 | |
|     // Need to set some attribute locations
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Position), "rawpos");
 | |
| 
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::PositionMatrix), "posmtx");
 | |
| 
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Color0), "rawcolor0");
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Color1), "rawcolor1");
 | |
| 
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Normal), "rawnormal");
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Tangent), "rawtangent");
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::Binormal), "rawbinormal");
 | |
|   }
 | |
| 
 | |
|   for (int i = 0; i < 8; i++)
 | |
|   {
 | |
|     // Per documentation: OpenGL copies the name string when glBindAttribLocation is called, so an
 | |
|     // application may free its copy of the name string immediately after the function returns.
 | |
|     glBindAttribLocation(glprogid, static_cast<GLuint>(ShaderAttrib::TexCoord0 + i),
 | |
|                          fmt::format("rawtex{}", i).c_str());
 | |
|   }
 | |
| }
 | |
| 
 | |
| void SHADER::Bind() const
 | |
| {
 | |
|   if (CurrentProgram != glprogid)
 | |
|   {
 | |
|     INCSTAT(g_stats.this_frame.num_shader_changes);
 | |
|     glUseProgram(glprogid);
 | |
|     CurrentProgram = glprogid;
 | |
|   }
 | |
| }
 | |
| 
 | |
| void SHADER::DestroyShaders()
 | |
| {
 | |
|   if (vsid)
 | |
|   {
 | |
|     glDeleteShader(vsid);
 | |
|     vsid = 0;
 | |
|   }
 | |
|   if (gsid)
 | |
|   {
 | |
|     glDeleteShader(gsid);
 | |
|     gsid = 0;
 | |
|   }
 | |
|   if (psid)
 | |
|   {
 | |
|     glDeleteShader(psid);
 | |
|     psid = 0;
 | |
|   }
 | |
| }
 | |
| 
 | |
| bool PipelineProgramKey::operator==(const PipelineProgramKey& rhs) const
 | |
| {
 | |
|   return std::tie(vertex_shader_id, geometry_shader_id, pixel_shader_id) ==
 | |
|          std::tie(rhs.vertex_shader_id, rhs.geometry_shader_id, rhs.pixel_shader_id);
 | |
| }
 | |
| 
 | |
| bool PipelineProgramKey::operator<(const PipelineProgramKey& rhs) const
 | |
| {
 | |
|   return std::tie(vertex_shader_id, geometry_shader_id, pixel_shader_id) <
 | |
|          std::tie(rhs.vertex_shader_id, rhs.geometry_shader_id, rhs.pixel_shader_id);
 | |
| }
 | |
| 
 | |
| std::size_t PipelineProgramKeyHash::operator()(const PipelineProgramKey& key) const
 | |
| {
 | |
|   // We would really want std::hash_combine for this..
 | |
|   std::hash<u64> hasher;
 | |
|   return hasher(key.vertex_shader_id) + hasher(key.geometry_shader_id) +
 | |
|          hasher(key.pixel_shader_id);
 | |
| }
 | |
| 
 | |
| StreamBuffer* ProgramShaderCache::GetUniformBuffer()
 | |
| {
 | |
|   return s_buffer.get();
 | |
| }
 | |
| 
 | |
| u32 ProgramShaderCache::GetUniformBufferAlignment()
 | |
| {
 | |
|   return s_ubo_align;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::UploadConstants()
 | |
| {
 | |
|   auto& system = Core::System::GetInstance();
 | |
|   auto& pixel_shader_manager = system.GetPixelShaderManager();
 | |
|   auto& vertex_shader_manager = system.GetVertexShaderManager();
 | |
|   auto& geometry_shader_manager = system.GetGeometryShaderManager();
 | |
|   if (pixel_shader_manager.dirty || vertex_shader_manager.dirty || geometry_shader_manager.dirty ||
 | |
|       pixel_shader_manager.custom_constants_dirty)
 | |
|   {
 | |
|     const u32 custom_constants_size = static_cast<u32>(
 | |
|         Common::AlignUp(pixel_shader_manager.custom_constants.size(), s_ubo_align));
 | |
|     auto buffer = s_buffer->Map(s_ubo_buffer_size + custom_constants_size, s_ubo_align);
 | |
| 
 | |
|     memcpy(buffer.first, &pixel_shader_manager.constants, sizeof(PixelShaderConstants));
 | |
| 
 | |
|     u64 size = Common::AlignUp(sizeof(PixelShaderConstants), s_ubo_align);
 | |
| 
 | |
|     memcpy(buffer.first + size, &vertex_shader_manager.constants, sizeof(VertexShaderConstants));
 | |
|     size += Common::AlignUp(sizeof(VertexShaderConstants), s_ubo_align);
 | |
| 
 | |
|     if (!pixel_shader_manager.custom_constants.empty())
 | |
|     {
 | |
|       memcpy(buffer.first + size, pixel_shader_manager.custom_constants.data(),
 | |
|              pixel_shader_manager.custom_constants.size());
 | |
|       size += custom_constants_size;
 | |
|     }
 | |
| 
 | |
|     memcpy(buffer.first + size, &geometry_shader_manager.constants,
 | |
|            sizeof(GeometryShaderConstants));
 | |
| 
 | |
|     s_buffer->Unmap(s_ubo_buffer_size + custom_constants_size);
 | |
| 
 | |
|     glBindBufferRange(GL_UNIFORM_BUFFER, 1, s_buffer->m_buffer, buffer.second,
 | |
|                       sizeof(PixelShaderConstants));
 | |
|     size = Common::AlignUp(sizeof(PixelShaderConstants), s_ubo_align);
 | |
|     glBindBufferRange(GL_UNIFORM_BUFFER, 2, s_buffer->m_buffer, buffer.second + size,
 | |
|                       sizeof(VertexShaderConstants));
 | |
|     size += Common::AlignUp(sizeof(VertexShaderConstants), s_ubo_align);
 | |
| 
 | |
|     if (!pixel_shader_manager.custom_constants.empty())
 | |
|     {
 | |
|       glBindBufferRange(GL_UNIFORM_BUFFER, 3, s_buffer->m_buffer, buffer.second + size,
 | |
|                         pixel_shader_manager.custom_constants.size());
 | |
|       size += Common::AlignUp(pixel_shader_manager.custom_constants.size(), s_ubo_align);
 | |
|     }
 | |
|     glBindBufferRange(GL_UNIFORM_BUFFER, 4, s_buffer->m_buffer, buffer.second + size,
 | |
|                       sizeof(GeometryShaderConstants));
 | |
| 
 | |
|     pixel_shader_manager.dirty = false;
 | |
|     vertex_shader_manager.dirty = false;
 | |
|     geometry_shader_manager.dirty = false;
 | |
|     pixel_shader_manager.custom_constants_dirty = false;
 | |
| 
 | |
|     ADDSTAT(g_stats.this_frame.bytes_uniform_streamed, s_ubo_buffer_size + custom_constants_size);
 | |
|   }
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::UploadConstants(const void* data, u32 data_size)
 | |
| {
 | |
|   // allocate and copy
 | |
|   const u32 alloc_size = Common::AlignUp(data_size, s_ubo_align);
 | |
|   auto buffer = s_buffer->Map(alloc_size, s_ubo_align);
 | |
|   std::memcpy(buffer.first, data, data_size);
 | |
|   s_buffer->Unmap(alloc_size);
 | |
| 
 | |
|   // bind the same sub-buffer to all stages
 | |
|   for (u32 index = 1; index <= 4; index++)
 | |
|     glBindBufferRange(GL_UNIFORM_BUFFER, index, s_buffer->m_buffer, buffer.second, data_size);
 | |
| 
 | |
|   ADDSTAT(g_stats.this_frame.bytes_uniform_streamed, data_size);
 | |
| }
 | |
| 
 | |
| bool ProgramShaderCache::CompileComputeShader(SHADER& shader, std::string_view code)
 | |
| {
 | |
|   // We need to enable GL_ARB_compute_shader for drivers that support the extension,
 | |
|   // but not GLSL 4.3. Mesa is one example.
 | |
|   std::string full_code;
 | |
|   if (g_backend_info.bSupportsComputeShaders && g_ogl_config.eSupportedGLSLVersion < Glsl430)
 | |
|   {
 | |
|     full_code = "#extension GL_ARB_compute_shader : enable\n";
 | |
|   }
 | |
| 
 | |
|   full_code += code;
 | |
|   const GLuint shader_id = CompileSingleShader(GL_COMPUTE_SHADER, full_code);
 | |
|   if (!shader_id)
 | |
|     return false;
 | |
| 
 | |
|   shader.glprogid = glCreateProgram();
 | |
|   glAttachShader(shader.glprogid, shader_id);
 | |
|   shader.SetProgramBindings(true);
 | |
|   glLinkProgram(shader.glprogid);
 | |
| 
 | |
|   // original shaders aren't needed any more
 | |
|   glDeleteShader(shader_id);
 | |
| 
 | |
|   if (!CheckProgramLinkResult(shader.glprogid, full_code, {}, {}))
 | |
|   {
 | |
|     shader.Destroy();
 | |
|     return false;
 | |
|   }
 | |
| 
 | |
|   shader.SetProgramVariables();
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| GLuint ProgramShaderCache::CompileSingleShader(GLenum type, std::string_view code)
 | |
| {
 | |
|   const GLuint result = glCreateShader(type);
 | |
| 
 | |
|   constexpr GLsizei num_strings = 2;
 | |
|   const std::array<const char*, num_strings> src{
 | |
|       s_glsl_header.data(),
 | |
|       code.data(),
 | |
|   };
 | |
|   const std::array<GLint, num_strings> src_sizes{
 | |
|       static_cast<GLint>(s_glsl_header.size()),
 | |
|       static_cast<GLint>(code.size()),
 | |
|   };
 | |
| 
 | |
|   glShaderSource(result, num_strings, src.data(), src_sizes.data());
 | |
|   glCompileShader(result);
 | |
| 
 | |
|   if (!CheckShaderCompileResult(result, type, code))
 | |
|   {
 | |
|     // Don't try to use this shader
 | |
|     glDeleteShader(result);
 | |
|     return 0;
 | |
|   }
 | |
| 
 | |
|   return result;
 | |
| }
 | |
| 
 | |
| bool ProgramShaderCache::CheckShaderCompileResult(GLuint id, GLenum type, std::string_view code)
 | |
| {
 | |
|   GLint compileStatus;
 | |
|   glGetShaderiv(id, GL_COMPILE_STATUS, &compileStatus);
 | |
|   GLsizei length = 0;
 | |
|   glGetShaderiv(id, GL_INFO_LOG_LENGTH, &length);
 | |
|   if (compileStatus != GL_TRUE || length > 1)
 | |
|   {
 | |
|     std::string info_log;
 | |
|     info_log.resize(length);
 | |
|     glGetShaderInfoLog(id, length, &length, &info_log[0]);
 | |
| 
 | |
|     const char* prefix = "";
 | |
|     switch (type)
 | |
|     {
 | |
|     case GL_VERTEX_SHADER:
 | |
|       prefix = "vs";
 | |
|       break;
 | |
|     case GL_GEOMETRY_SHADER:
 | |
|       prefix = "gs";
 | |
|       break;
 | |
|     case GL_FRAGMENT_SHADER:
 | |
|       prefix = "ps";
 | |
|       break;
 | |
|     case GL_COMPUTE_SHADER:
 | |
|       prefix = "cs";
 | |
|       break;
 | |
|     }
 | |
| 
 | |
|     if (compileStatus != GL_TRUE)
 | |
|     {
 | |
|       ERROR_LOG_FMT(VIDEO, "{} failed compilation:\n{}", prefix, info_log);
 | |
| 
 | |
|       std::string filename = VideoBackendBase::BadShaderFilename(prefix, num_failures++);
 | |
|       std::ofstream file;
 | |
|       File::OpenFStream(file, filename, std::ios_base::out);
 | |
|       file << s_glsl_header << code << info_log;
 | |
|       file << "\n";
 | |
|       file << "Dolphin Version: " + Common::GetScmRevStr() + "\n";
 | |
|       file << "Video Backend: " + g_video_backend->GetDisplayName();
 | |
|       file.close();
 | |
| 
 | |
|       PanicAlertFmt("Failed to compile {} shader: {}\n"
 | |
|                     "Debug info ({}, {}, {}):\n{}",
 | |
|                     prefix, filename, g_ogl_config.gl_vendor, g_ogl_config.gl_renderer,
 | |
|                     g_ogl_config.gl_version, info_log);
 | |
| 
 | |
|       return false;
 | |
|     }
 | |
| 
 | |
|     WARN_LOG_FMT(VIDEO, "{} compiled with warnings:\n{}", prefix, info_log);
 | |
|   }
 | |
| 
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| bool ProgramShaderCache::CheckProgramLinkResult(GLuint id, std::string_view vcode,
 | |
|                                                 std::string_view pcode, std::string_view gcode)
 | |
| {
 | |
|   GLint linkStatus;
 | |
|   glGetProgramiv(id, GL_LINK_STATUS, &linkStatus);
 | |
|   GLsizei length = 0;
 | |
|   glGetProgramiv(id, GL_INFO_LOG_LENGTH, &length);
 | |
|   if (linkStatus != GL_TRUE || length > 1)
 | |
|   {
 | |
|     std::string info_log;
 | |
|     info_log.resize(length);
 | |
|     glGetProgramInfoLog(id, length, &length, &info_log[0]);
 | |
|     if (linkStatus != GL_TRUE)
 | |
|     {
 | |
|       ERROR_LOG_FMT(VIDEO, "Program failed linking:\n{}", info_log);
 | |
|       std::string filename = VideoBackendBase::BadShaderFilename("p", num_failures++);
 | |
|       std::ofstream file;
 | |
|       File::OpenFStream(file, filename, std::ios_base::out);
 | |
|       if (!vcode.empty())
 | |
|         file << s_glsl_header << vcode << '\n';
 | |
|       if (!gcode.empty())
 | |
|         file << s_glsl_header << gcode << '\n';
 | |
|       if (!pcode.empty())
 | |
|         file << s_glsl_header << pcode << '\n';
 | |
| 
 | |
|       file << info_log;
 | |
|       file << "\n";
 | |
|       file << "Dolphin Version: " + Common::GetScmRevStr() + "\n";
 | |
|       file << "Video Backend: " + g_video_backend->GetDisplayName();
 | |
|       file.close();
 | |
| 
 | |
|       PanicAlertFmt("Failed to link shaders: {}\n"
 | |
|                     "Debug info ({}, {}, {}):\n{}",
 | |
|                     filename, g_ogl_config.gl_vendor, g_ogl_config.gl_renderer,
 | |
|                     g_ogl_config.gl_version, info_log);
 | |
| 
 | |
|       return false;
 | |
|     }
 | |
| 
 | |
|     WARN_LOG_FMT(VIDEO, "Program linked with warnings:\n{}", info_log);
 | |
|   }
 | |
| 
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::Init()
 | |
| {
 | |
|   // We have to get the UBO alignment here because
 | |
|   // if we generate a buffer that isn't aligned
 | |
|   // then the UBO will fail.
 | |
|   glGetIntegerv(GL_UNIFORM_BUFFER_OFFSET_ALIGNMENT, &s_ubo_align);
 | |
| 
 | |
|   s_ubo_buffer_size =
 | |
|       static_cast<u32>(Common::AlignUp(sizeof(PixelShaderConstants), s_ubo_align) +
 | |
|                        Common::AlignUp(sizeof(VertexShaderConstants), s_ubo_align) +
 | |
|                        Common::AlignUp(sizeof(GeometryShaderConstants), s_ubo_align));
 | |
| 
 | |
|   // We multiply by *4*4 because we need to get down to basic machine units.
 | |
|   // So multiply by four to get how many floats we have from vec4s
 | |
|   // Then once more to get bytes
 | |
|   s_buffer = StreamBuffer::Create(GL_UNIFORM_BUFFER, VertexManagerBase::UNIFORM_STREAM_BUFFER_SIZE);
 | |
| 
 | |
|   CreateHeader();
 | |
|   CreateAttributelessVAO();
 | |
| 
 | |
|   CurrentProgram = 0;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::Shutdown()
 | |
| {
 | |
|   s_buffer.reset();
 | |
| 
 | |
|   glBindVertexArray(0);
 | |
|   glDeleteBuffers(1, &s_attributeless_VBO);
 | |
|   glDeleteVertexArrays(1, &s_attributeless_VAO);
 | |
|   s_attributeless_VBO = 0;
 | |
|   s_attributeless_VAO = 0;
 | |
|   s_last_VAO = 0;
 | |
| 
 | |
|   // All pipeline programs should have been released.
 | |
|   DEBUG_ASSERT(s_pipeline_programs.empty());
 | |
|   s_pipeline_programs.clear();
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::CreateAttributelessVAO()
 | |
| {
 | |
|   glGenVertexArrays(1, &s_attributeless_VAO);
 | |
| 
 | |
|   // In a compatibility context, we require a valid, bound array buffer.
 | |
|   glGenBuffers(1, &s_attributeless_VBO);
 | |
| 
 | |
|   // Initialize the buffer with nothing. 16 floats is an arbitrary size that may work around driver
 | |
|   // issues.
 | |
|   glBindBuffer(GL_ARRAY_BUFFER, s_attributeless_VBO);
 | |
|   glBufferData(GL_ARRAY_BUFFER, sizeof(GLfloat) * 16, nullptr, GL_STATIC_DRAW);
 | |
| 
 | |
|   // We must also define vertex attribute 0.
 | |
|   glBindVertexArray(s_attributeless_VAO);
 | |
|   glVertexAttribPointer(0, 2, GL_FLOAT, GL_FALSE, 0, nullptr);
 | |
|   glEnableVertexAttribArray(0);
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::BindVertexFormat(const GLVertexFormat* vertex_format)
 | |
| {
 | |
|   u32 new_VAO = vertex_format ? vertex_format->VAO : s_attributeless_VAO;
 | |
|   if (s_last_VAO == new_VAO)
 | |
|     return;
 | |
| 
 | |
|   glBindVertexArray(new_VAO);
 | |
|   s_last_VAO = new_VAO;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::ReBindVertexFormat()
 | |
| {
 | |
|   if (s_last_VAO)
 | |
|     glBindVertexArray(s_last_VAO);
 | |
| }
 | |
| 
 | |
| bool ProgramShaderCache::IsValidVertexFormatBound()
 | |
| {
 | |
|   return s_last_VAO != 0 && s_last_VAO != s_attributeless_VAO;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::InvalidateVertexFormat()
 | |
| {
 | |
|   s_last_VAO = 0;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::InvalidateVertexFormatIfBound(GLuint vao)
 | |
| {
 | |
|   if (s_last_VAO == vao)
 | |
|     s_last_VAO = 0;
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::InvalidateLastProgram()
 | |
| {
 | |
|   CurrentProgram = 0;
 | |
| }
 | |
| 
 | |
| PipelineProgram* ProgramShaderCache::GetPipelineProgram(const GLVertexFormat* vertex_format,
 | |
|                                                         const OGLShader* vertex_shader,
 | |
|                                                         const OGLShader* geometry_shader,
 | |
|                                                         const OGLShader* pixel_shader,
 | |
|                                                         const void* cache_data,
 | |
|                                                         size_t cache_data_size)
 | |
| {
 | |
|   PipelineProgramKey key = {vertex_shader ? vertex_shader->GetID() : 0,
 | |
|                             geometry_shader ? geometry_shader->GetID() : 0,
 | |
|                             pixel_shader ? pixel_shader->GetID() : 0};
 | |
|   {
 | |
|     std::lock_guard guard{s_pipeline_program_lock};
 | |
|     auto iter = s_pipeline_programs.find(key);
 | |
|     if (iter != s_pipeline_programs.end())
 | |
|     {
 | |
|       iter->second->reference_count++;
 | |
|       return iter->second.get();
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   std::unique_ptr<PipelineProgram> prog = std::make_unique<PipelineProgram>();
 | |
|   prog->key = key;
 | |
|   prog->shader.glprogid = glCreateProgram();
 | |
| 
 | |
|   // Use the cache data, if present. If this fails, we want to return an error, so the shader cache
 | |
|   // doesn't attempt to use the same binary data in the future.
 | |
|   if (cache_data_size >= sizeof(u32))
 | |
|   {
 | |
|     u32 program_binary_type;
 | |
|     std::memcpy(&program_binary_type, cache_data, sizeof(u32));
 | |
|     glProgramBinary(prog->shader.glprogid, static_cast<GLenum>(program_binary_type),
 | |
|                     static_cast<const u8*>(cache_data) + sizeof(u32),
 | |
|                     static_cast<GLsizei>(cache_data_size - sizeof(u32)));
 | |
| 
 | |
|     // Check the link status. If this fails, it means the binary was invalid.
 | |
|     GLint link_status;
 | |
|     glGetProgramiv(prog->shader.glprogid, GL_LINK_STATUS, &link_status);
 | |
|     if (link_status != GL_TRUE)
 | |
|     {
 | |
|       WARN_LOG_FMT(VIDEO, "Failed to create GL program from program binary.");
 | |
|       prog->shader.Destroy();
 | |
|       return nullptr;
 | |
|     }
 | |
| 
 | |
|     // We don't want to retrieve this binary and duplicate entries in the cache again.
 | |
|     // See the explanation in OGLPipeline.cpp.
 | |
|     prog->binary_retrieved = true;
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     // We temporarily change the vertex array to the pipeline's vertex format.
 | |
|     // This can prevent the NVIDIA OpenGL driver from recompiling on first use.
 | |
|     GLuint vao = vertex_format ? vertex_format->VAO : s_attributeless_VAO;
 | |
|     if (s_is_shared_context || vao != s_last_VAO)
 | |
|       glBindVertexArray(vao);
 | |
| 
 | |
|     // Attach shaders.
 | |
|     ASSERT(vertex_shader && vertex_shader->GetStage() == ShaderStage::Vertex);
 | |
|     ASSERT(pixel_shader && pixel_shader->GetStage() == ShaderStage::Pixel);
 | |
|     glAttachShader(prog->shader.glprogid, vertex_shader->GetGLShaderID());
 | |
|     glAttachShader(prog->shader.glprogid, pixel_shader->GetGLShaderID());
 | |
|     if (geometry_shader)
 | |
|     {
 | |
|       ASSERT(geometry_shader->GetStage() == ShaderStage::Geometry);
 | |
|       glAttachShader(prog->shader.glprogid, geometry_shader->GetGLShaderID());
 | |
|     }
 | |
| 
 | |
|     if (g_backend_info.bSupportsPipelineCacheData)
 | |
|       glProgramParameteri(prog->shader.glprogid, GL_PROGRAM_BINARY_RETRIEVABLE_HINT, GL_TRUE);
 | |
| 
 | |
|     // Link program.
 | |
|     prog->shader.SetProgramBindings(false);
 | |
|     glLinkProgram(prog->shader.glprogid);
 | |
| 
 | |
|     // Restore VAO binding after linking.
 | |
|     if (!s_is_shared_context && vao != s_last_VAO)
 | |
|       glBindVertexArray(s_last_VAO);
 | |
| 
 | |
|     if (!CheckProgramLinkResult(prog->shader.glprogid,
 | |
|                                 vertex_shader ? vertex_shader->GetSource() : std::string_view{},
 | |
|                                 geometry_shader ? geometry_shader->GetSource() : std::string_view{},
 | |
|                                 pixel_shader ? pixel_shader->GetSource() : std::string_view{}))
 | |
|     {
 | |
|       prog->shader.Destroy();
 | |
|       return nullptr;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Lock to insert. A duplicate program may have been created in the meantime.
 | |
|   std::lock_guard guard{s_pipeline_program_lock};
 | |
|   auto iter = s_pipeline_programs.find(key);
 | |
|   if (iter != s_pipeline_programs.end())
 | |
|   {
 | |
|     // Destroy this program, and use the one which was created first.
 | |
|     prog->shader.Destroy();
 | |
|     iter->second->reference_count++;
 | |
|     return iter->second.get();
 | |
|   }
 | |
| 
 | |
|   // Set program variables on the shader which will be returned.
 | |
|   // This is only needed for drivers which don't support binding layout.
 | |
|   prog->shader.SetProgramVariables();
 | |
| 
 | |
|   // If this is a shared context, ensure we sync before we return the program to
 | |
|   // the main thread. If we don't do this, some driver can lock up (e.g. AMD).
 | |
|   if (s_is_shared_context)
 | |
|     glFinish();
 | |
| 
 | |
|   auto ip = s_pipeline_programs.emplace(key, std::move(prog));
 | |
|   return ip.first->second.get();
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::ReleasePipelineProgram(PipelineProgram* prog)
 | |
| {
 | |
|   if (--prog->reference_count > 0)
 | |
|     return;
 | |
| 
 | |
|   prog->shader.Destroy();
 | |
| 
 | |
|   std::lock_guard guard{s_pipeline_program_lock};
 | |
|   const auto iter = s_pipeline_programs.find(prog->key);
 | |
|   ASSERT(iter != s_pipeline_programs.end() && prog == iter->second.get());
 | |
|   s_pipeline_programs.erase(iter);
 | |
| }
 | |
| 
 | |
| void ProgramShaderCache::CreateHeader()
 | |
| {
 | |
|   GlslVersion v = g_ogl_config.eSupportedGLSLVersion;
 | |
|   bool is_glsles = v >= GlslEs300;
 | |
|   std::string SupportedESPointSize;
 | |
|   std::string SupportedESTextureBuffer;
 | |
|   switch (g_ogl_config.SupportedESPointSize)
 | |
|   {
 | |
|   case EsPointSizeType::PointSizeOes:
 | |
|     SupportedESPointSize = "#extension GL_OES_geometry_point_size : enable";
 | |
|     break;
 | |
|   case EsPointSizeType::PointSizeExt:
 | |
|     SupportedESPointSize = "#extension GL_EXT_geometry_point_size : enable";
 | |
|     break;
 | |
|   case EsPointSizeType::PointSizeNone:
 | |
|   default:
 | |
|     SupportedESPointSize = "";
 | |
|     break;
 | |
|   }
 | |
| 
 | |
|   switch (g_ogl_config.SupportedESTextureBuffer)
 | |
|   {
 | |
|   case EsTexbufType::TexbufExt:
 | |
|     SupportedESTextureBuffer = "#extension GL_EXT_texture_buffer : enable";
 | |
|     break;
 | |
|   case EsTexbufType::TexbufOes:
 | |
|     SupportedESTextureBuffer = "#extension GL_OES_texture_buffer : enable";
 | |
|     break;
 | |
|   case EsTexbufType::TexbufCore:
 | |
|   case EsTexbufType::TexbufNone:
 | |
|     SupportedESTextureBuffer = "";
 | |
|     break;
 | |
|   }
 | |
| 
 | |
|   std::string earlyz_string;
 | |
|   if (g_backend_info.bSupportsEarlyZ)
 | |
|   {
 | |
|     if (g_ogl_config.bSupportsImageLoadStore)
 | |
|     {
 | |
|       earlyz_string = "#define FORCE_EARLY_Z layout(early_fragment_tests) in\n";
 | |
|     }
 | |
|     else if (g_ogl_config.bSupportsConservativeDepth)
 | |
|     {
 | |
|       // See PixelShaderGen for details about this fallback.
 | |
|       earlyz_string = "#define FORCE_EARLY_Z layout(depth_unchanged) out float gl_FragDepth\n";
 | |
|       earlyz_string += "#extension GL_ARB_conservative_depth : enable\n";
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   std::string framebuffer_fetch_string;
 | |
|   switch (g_ogl_config.SupportedFramebufferFetch)
 | |
|   {
 | |
|   case EsFbFetchType::FbFetchExt:
 | |
|     framebuffer_fetch_string = "#extension GL_EXT_shader_framebuffer_fetch: enable\n"
 | |
|                                "#define FRAGMENT_INOUT inout";
 | |
|     break;
 | |
|   case EsFbFetchType::FbFetchArm:
 | |
|     framebuffer_fetch_string = "#extension GL_ARM_shader_framebuffer_fetch: enable\n"
 | |
|                                "#define FB_FETCH_VALUE gl_LastFragColorARM\n"
 | |
|                                "#define FRAGMENT_INOUT out";
 | |
|     break;
 | |
|   case EsFbFetchType::FbFetchNone:
 | |
|     framebuffer_fetch_string = "";
 | |
|     break;
 | |
|   }
 | |
| 
 | |
|   // The sampler2DMSArray keyword is reserved in GLSL ES 3.0 and 3.1, but is available in 3.2 and
 | |
|   // with GL_OES_texture_storage_multisample_2d_array for 3.1.
 | |
|   // See https://bugs.dolphin-emu.org/issues/13198.
 | |
|   const bool use_multisample_2d_array_precision =
 | |
|       v >= GlslEs320 ||
 | |
|       g_ogl_config.SupportedMultisampleTexStorage != MultisampleTexStorageType::TexStorageNone;
 | |
| 
 | |
|   std::string binding_layout;
 | |
|   if (g_backend_info.bSupportsBindingLayout)
 | |
|   {
 | |
|     if (g_ogl_config.bSupportsExplicitLayoutInShader)
 | |
|     {
 | |
|       binding_layout =
 | |
|           "#extension GL_ARB_explicit_attrib_location : enable\n"
 | |
|           "#define ATTRIBUTE_LOCATION(x) layout(location = x)\n"
 | |
|           "#define FRAGMENT_OUTPUT_LOCATION(x) layout(location = x)\n"
 | |
|           "#define FRAGMENT_OUTPUT_LOCATION_INDEXED(x, y) layout(location = x, index = y)\n"
 | |
|           "#define UBO_BINDING(packing, x) layout(packing, binding = x)\n"
 | |
|           "#define SAMPLER_BINDING(x) layout(binding = x)\n"
 | |
|           "#define TEXEL_BUFFER_BINDING(x) layout(binding = x)\n"
 | |
|           "#define SSBO_BINDING(x) layout(std430, binding = x)\n"
 | |
|           "#define IMAGE_BINDING(format, x) layout(format, binding = x)\n";
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       binding_layout = "#define ATTRIBUTE_LOCATION(x)\n"
 | |
|                        "#define FRAGMENT_OUTPUT_LOCATION(x)\n"
 | |
|                        "#define FRAGMENT_OUTPUT_LOCATION_INDEXED(x, y)\n"
 | |
|                        "#define UBO_BINDING(packing, x) layout(packing, binding = x)\n"
 | |
|                        "#define SAMPLER_BINDING(x) layout(binding = x)\n"
 | |
|                        "#define TEXEL_BUFFER_BINDING(x) layout(binding = x)\n"
 | |
|                        "#define SSBO_BINDING(x) layout(std430, binding = x)\n"
 | |
|                        "#define IMAGE_BINDING(format, x) layout(format, binding = x)\n";
 | |
|     }
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     binding_layout = "#define ATTRIBUTE_LOCATION(x)\n"
 | |
|                      "#define FRAGMENT_OUTPUT_LOCATION(x)\n"
 | |
|                      "#define FRAGMENT_OUTPUT_LOCATION_INDEXED(x, y)\n"
 | |
|                      "#define UBO_BINDING(packing, x) layout(packing)\n"
 | |
|                      "#define SAMPLER_BINDING(x)\n"
 | |
|                      "#define TEXEL_BUFFER_BINDING(x)\n"
 | |
|                      "#define SSBO_BINDING(x) layout(std430)\n"
 | |
|                      "#define IMAGE_BINDING(format, x) layout(format)\n";
 | |
|   }
 | |
| 
 | |
|   // TODO: actually define this if using 'bSupportsExplicitLayoutInShader'
 | |
|   const std::string varying_location = "#define VARYING_LOCATION(x)\n";
 | |
| 
 | |
|   std::string shader_shuffle_string;
 | |
|   if (g_ogl_config.bSupportsKHRShaderSubgroup)
 | |
|   {
 | |
|     shader_shuffle_string = R"(
 | |
| #extension GL_KHR_shader_subgroup_basic : enable
 | |
| #extension GL_KHR_shader_subgroup_arithmetic : enable
 | |
| #extension GL_KHR_shader_subgroup_ballot : enable
 | |
| 
 | |
| #define SUPPORTS_SUBGROUP_REDUCTION 1
 | |
| #define IS_HELPER_INVOCATION gl_HelperInvocation
 | |
| #define IS_FIRST_ACTIVE_INVOCATION (subgroupElect())
 | |
| #define SUBGROUP_MIN(value) value = subgroupMin(value)
 | |
| #define SUBGROUP_MAX(value) value = subgroupMax(value)
 | |
| )";
 | |
|   }
 | |
| 
 | |
|   s_glsl_header = fmt::format(
 | |
|       "{}\n"
 | |
|       "{}\n"  // ubo
 | |
|       "{}\n"  // early-z
 | |
|       "{}\n"  // 420pack
 | |
|       "{}\n"  // msaa
 | |
|       "{}\n"  // Input/output/sampler binding
 | |
|       "{}\n"  // Varying location
 | |
|       "{}\n"  // storage buffer
 | |
|       "{}\n"  // shader5
 | |
|       "{}\n"  // SSAA
 | |
|       "{}\n"  // Geometry point size
 | |
|       "{}\n"  // AEP
 | |
|       "{}\n"  // texture buffer
 | |
|       "{}\n"  // ES texture buffer
 | |
|       "{}\n"  // ES dual source blend
 | |
|       "{}\n"  // shader image load store
 | |
|       "{}\n"  // shader framebuffer fetch
 | |
|       "{}\n"  // shader thread shuffle
 | |
|       "{}\n"  // derivative control
 | |
|       "{}\n"  // query levels
 | |
|       "{}\n"  // OES multisample texture storage
 | |
| 
 | |
|       // Precision defines for GLSL ES
 | |
|       "{}\n"
 | |
|       "{}\n"
 | |
|       "{}\n"
 | |
|       "{}\n"
 | |
|       "{}\n"
 | |
|       "{}\n"
 | |
| 
 | |
|       // Silly differences
 | |
|       "#define API_OPENGL 1\n"
 | |
|       "#define float2 vec2\n"
 | |
|       "#define float3 vec3\n"
 | |
|       "#define float4 vec4\n"
 | |
|       "#define uint2 uvec2\n"
 | |
|       "#define uint3 uvec3\n"
 | |
|       "#define uint4 uvec4\n"
 | |
|       "#define int2 ivec2\n"
 | |
|       "#define int3 ivec3\n"
 | |
|       "#define int4 ivec4\n"
 | |
|       "#define frac fract\n"
 | |
|       "#define lerp mix\n"
 | |
| 
 | |
|       ,
 | |
|       GetGLSLVersionString(), v < Glsl140 ? "#extension GL_ARB_uniform_buffer_object : enable" : "",
 | |
|       earlyz_string,
 | |
|       (g_backend_info.bSupportsBindingLayout && v < GlslEs310) ?
 | |
|           "#extension GL_ARB_shading_language_420pack : enable" :
 | |
|           "",
 | |
|       (g_ogl_config.bSupportsMSAA && v < Glsl150) ?
 | |
|           "#extension GL_ARB_texture_multisample : enable" :
 | |
|           "",
 | |
|       binding_layout.c_str(), varying_location.c_str(),
 | |
|       !is_glsles && g_backend_info.bSupportsFragmentStoresAndAtomics ?
 | |
|           "#extension GL_ARB_shader_storage_buffer_object : enable" :
 | |
|           "",
 | |
|       v < Glsl400 && g_backend_info.bSupportsGSInstancing ?
 | |
|           "#extension GL_ARB_gpu_shader5 : enable" :
 | |
|           "",
 | |
|       v < Glsl400 && g_backend_info.bSupportsSSAA ? "#extension GL_ARB_sample_shading : enable" :
 | |
|                                                     "",
 | |
|       SupportedESPointSize,
 | |
|       g_ogl_config.bSupportsAEP ? "#extension GL_ANDROID_extension_pack_es31a : enable" : "",
 | |
|       v < Glsl140 && g_backend_info.bSupportsPaletteConversion ?
 | |
|           "#extension GL_ARB_texture_buffer_object : enable" :
 | |
|           "",
 | |
|       SupportedESTextureBuffer,
 | |
|       is_glsles && g_backend_info.bSupportsDualSourceBlend ?
 | |
|           "#extension GL_EXT_blend_func_extended : enable" :
 | |
|           ""
 | |
| 
 | |
|       ,
 | |
|       g_ogl_config.bSupportsImageLoadStore &&
 | |
|               ((!is_glsles && v < Glsl430) || (is_glsles && v < GlslEs310)) ?
 | |
|           "#extension GL_ARB_shader_image_load_store : enable" :
 | |
|           "",
 | |
|       framebuffer_fetch_string, shader_shuffle_string,
 | |
|       g_backend_info.bSupportsCoarseDerivatives ? "#extension GL_ARB_derivative_control : enable" :
 | |
|                                                   "",
 | |
|       g_backend_info.bSupportsTextureQueryLevels ?
 | |
|           "#extension GL_ARB_texture_query_levels : enable" :
 | |
|           "",
 | |
|       // Note: GL_ARB_texture_storage_multisample doesn't have an #extension, as it doesn't
 | |
|       // need to change GLSL, but on GLES 3.1 sampler2DMSArray is a reserved keyword unless
 | |
|       // the extension is enabled. Thus, we don't need to check TexStorageCore/have an ARB version.
 | |
|       g_ogl_config.SupportedMultisampleTexStorage == MultisampleTexStorageType::TexStorageOes ?
 | |
|           "#extension GL_OES_texture_storage_multisample_2d_array : enable" :
 | |
|           "",
 | |
|       is_glsles ? "precision highp float;" : "", is_glsles ? "precision highp int;" : "",
 | |
|       is_glsles ? "precision highp sampler2DArray;" : "",
 | |
|       (is_glsles && g_backend_info.bSupportsPaletteConversion) ? "precision highp usamplerBuffer;" :
 | |
|                                                                  "",
 | |
|       use_multisample_2d_array_precision ? "precision highp sampler2DMSArray;" : "",
 | |
|       v >= GlslEs310 ? "precision highp image2DArray;" : "");
 | |
| }
 | |
| 
 | |
| u64 ProgramShaderCache::GenerateShaderID()
 | |
| {
 | |
|   return s_shader_counter++;
 | |
| }
 | |
| 
 | |
| bool SharedContextAsyncShaderCompiler::WorkerThreadInitMainThread(void** param)
 | |
| {
 | |
|   std::unique_ptr<GLContext> context = GetOGLGfx()->GetMainGLContext()->CreateSharedContext();
 | |
|   if (!context)
 | |
|   {
 | |
|     PanicAlertFmt("Failed to create shared context for shader compiling.");
 | |
|     return false;
 | |
|   }
 | |
| 
 | |
|   *param = context.release();
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| bool SharedContextAsyncShaderCompiler::WorkerThreadInitWorkerThread(void* param)
 | |
| {
 | |
|   GLContext* context = static_cast<GLContext*>(param);
 | |
|   if (!context->MakeCurrent())
 | |
|     return false;
 | |
| 
 | |
|   s_is_shared_context = true;
 | |
| 
 | |
|   // Make the state match the main context to have a better chance of avoiding recompiles.
 | |
|   if (!context->IsGLES())
 | |
|     glEnable(GL_PROGRAM_POINT_SIZE);
 | |
|   if (g_backend_info.bSupportsClipControl)
 | |
|     glClipControl(GL_LOWER_LEFT, GL_ZERO_TO_ONE);
 | |
|   if (g_backend_info.bSupportsDepthClamp)
 | |
|   {
 | |
|     glEnable(GL_CLIP_DISTANCE0);
 | |
|     glEnable(GL_CLIP_DISTANCE1);
 | |
|     glEnable(GL_DEPTH_CLAMP);
 | |
|   }
 | |
|   if (g_backend_info.bSupportsPrimitiveRestart)
 | |
|     GLUtil::EnablePrimitiveRestart(context);
 | |
| 
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| void SharedContextAsyncShaderCompiler::WorkerThreadExit(void* param)
 | |
| {
 | |
|   GLContext* context = static_cast<GLContext*>(param);
 | |
|   context->ClearCurrent();
 | |
|   delete context;
 | |
| }
 | |
| }  // namespace OGL
 |