Files
test/source/blender/gpu/intern/gpu_shader_private.hh
Miguel Pozo e6638d6e5e Refactor: GPU: GPUMaterial & GPUPass compilation
Cleanup and simplification of GPUMaterial and GPUPass compilation.
See #133674 for details/goals.

- Remove the `draw_manage_shader` thread.
  Deferred compilation is now handled by the gpu::ShaderCompiler
  through the batch compilation API.
  Batch management is handled by the `GPUPassCache`.
- Simplify `GPUMaterial` status tracking so it just queries the
  `GPUPass` status.
- Split the `GPUPass` and the `GPUCodegen` code.
- Replace the (broken) `GPU_material_recalc_flag_get` with the new
  `GPU_pass_compilation_timestamp`.
- Add the `GPU_pass_cache_wait_for_all` and
  `GPU_shader_batch_wait_for_all`, and remove the busy waits from
   EEVEE.
- Remove many unused functions, properties, includes...

Pull Request: https://projects.blender.org/blender/blender/pulls/135637
2025-05-22 17:53:22 +02:00

277 lines
8.3 KiB
C++

/* SPDX-FileCopyrightText: 2023 Blender Authors
*
* SPDX-License-Identifier: GPL-2.0-or-later */
/** \file
* \ingroup gpu
*/
#pragma once
#include "BLI_map.hh"
#include "BLI_span.hh"
#include "BLI_string_ref.hh"
#include "GPU_shader.hh"
#include "GPU_worker.hh"
#include "gpu_shader_create_info.hh"
#include "gpu_shader_interface.hh"
#include <atomic>
#include <condition_variable>
#include <cstdint>
#include <deque>
#include <memory>
#include <mutex>
#include <string>
namespace blender::gpu {
/* Forward declarations: `GPULogParser` is defined further down in this header, `Context` is only
* used through pointers here. */
class GPULogParser;
class Context;
/* Set to 1 to log the full source of shaders that fail to compile. */
#define DEBUG_LOG_SHADER_SRC_ON_ERROR 0
/**
* Compilation is done on a list of GLSL sources. This list contains placeholders that should be
* provided by the backend shader. These defines contain the indices in that list where the
* backend can patch the sources.
*/
#define SOURCES_INDEX_VERSION 0
#define SOURCES_INDEX_SPECIALIZATION_CONSTANTS 1
/**
* Implementation of shader compilation and uniforms handling.
* Base class which is then specialized for each implementation (GL, VK, ...).
*/
class Shader {
public:
/** Uniform & attribute locations for shader. */
ShaderInterface *interface = nullptr;
/** Bit-set indicating the frame-buffer color attachments that this shader writes to. */
uint16_t fragment_output_bits = 0;
/* Default specialization constants state as defined inside ShaderCreateInfo.
* Should be considered as const after init(). */
std::unique_ptr<const shader::SpecializationConstants> constants;
/* WORKAROUND: True if this shader is a polyline shader and needs an appropriate setup to render.
* Eventually, in the future, we should modify the user code instead of relying on such hacks. */
bool is_polyline = false;
protected:
/** For debugging purpose. Fixed 64 byte buffer, exposed read-only through `name_get()`. */
char name[64];
/* Parent shader can be used for shaders which are derived from the same source material.
* The child shader can pull information from its parent to prepare additional resources
* such as PSOs upfront. This enables asynchronous PSO compilation which mitigates stuttering
* when updating new materials. */
Shader *parent_shader_ = nullptr;
public:
/* NOTE(review): `name` is presumably copied into the fixed-size `name` member; confirm in the
* definition, which is not part of this header. */
Shader(const char *name);
virtual ~Shader();
/* Backend-specific initialization from the create info.
* TODO: Remove `is_batch_compilation`. */
virtual void init(const shader::ShaderCreateInfo &info, bool is_batch_compilation) = 0;
/* Per-stage compilation entry points, implemented by each backend. The source list is mutable
* because it contains placeholder entries (see `SOURCES_INDEX_*`) that the backend patches. */
virtual void vertex_shader_from_glsl(MutableSpan<StringRefNull> sources) = 0;
virtual void geometry_shader_from_glsl(MutableSpan<StringRefNull> sources) = 0;
virtual void fragment_shader_from_glsl(MutableSpan<StringRefNull> sources) = 0;
virtual void compute_shader_from_glsl(MutableSpan<StringRefNull> sources) = 0;
/* `info` is optional and defaults to null.
* NOTE(review): the return value presumably reports success; confirm against the backends. */
virtual bool finalize(const shader::ShaderCreateInfo *info = nullptr) = 0;
/* Pre-warms PSOs using parent shader's cached PSO descriptors. Limit specifies maximum PSOs to
* warm. If -1, compiles all PSO permutations in parent shader.
*
* See `GPU_shader_warm_cache(..)` in `GPU_shader.hh` for more information. */
virtual void warm_cache(int limit) = 0;
/* Bind/unbind the shader. `bind` receives the specialization constants state to use. */
virtual void bind(const shader::SpecializationConstants *constants_state) = 0;
virtual void unbind() = 0;
/* Uniform upload for the uniform at `location`.
* NOTE(review): presumably `comp_len` is the component count per element and `array_size` the
* number of elements read from `data`; confirm against the backends. */
virtual void uniform_float(int location, int comp_len, int array_size, const float *data) = 0;
virtual void uniform_int(int location, int comp_len, int array_size, const int *data) = 0;
/* Add specialization constant declarations to shader instance. */
void specialization_constants_init(const shader::ShaderCreateInfo &info);
/* Source-text generators: each returns a string built from the create info. Only
* `defines_declare` is implemented by this base class, the others are backend-specific. */
std::string defines_declare(const shader::ShaderCreateInfo &info) const;
virtual std::string resources_declare(const shader::ShaderCreateInfo &info) const = 0;
virtual std::string vertex_interface_declare(const shader::ShaderCreateInfo &info) const = 0;
virtual std::string fragment_interface_declare(const shader::ShaderCreateInfo &info) const = 0;
virtual std::string geometry_interface_declare(const shader::ShaderCreateInfo &info) const = 0;
virtual std::string geometry_layout_declare(const shader::ShaderCreateInfo &info) const = 0;
virtual std::string compute_layout_declare(const shader::ShaderCreateInfo &info) const = 0;
/* Debug name of the shader. The returned reference points into this object's `name` buffer. */
StringRefNull name_get() const
{
return name;
}
/* Set the parent shader. Only the pointer is stored (see `parent_shader_`). */
void parent_set(Shader *parent)
{
parent_shader_ = parent;
}
/* Parent shader, or null when none was set. */
Shader *parent_get() const
{
return parent_shader_;
}
static void set_srgb_uniform(Context *ctx, GPUShader *shader);
static void set_framebuffer_srgb_target(int use_srgb_to_linear);
protected:
/* Print a compilation log for the given stage.
* NOTE(review): presumably `error` selects error versus warning reporting and `parser` decodes
* the backend-specific log format; confirm in the definition. */
void print_log(Span<StringRefNull> sources,
const char *log,
const char *stage,
bool error,
GPULogParser *parser);
};
/* Syntactic sugar. */
/** View a backend `Shader` pointer as the `GPUShader` handle type (pure pointer cast). */
static inline GPUShader *wrap(Shader *vert)
{
  GPUShader *handle = reinterpret_cast<GPUShader *>(vert);
  return handle;
}
/** View a `GPUShader` handle as the backend `Shader` pointer (pure pointer cast). */
static inline Shader *unwrap(GPUShader *vert)
{
  Shader *shader = reinterpret_cast<Shader *>(vert);
  return shader;
}
/** Const overload: view a const `GPUShader` handle as a const `Shader` pointer. */
static inline const Shader *unwrap(const GPUShader *vert)
{
  const Shader *shader = reinterpret_cast<const Shader *>(vert);
  return shader;
}
/**
 * Shader compilation front-end. Exposes direct compilation (`compile`) and a batch API in which
 * a group of create-infos (or specializations) is identified by a handle that can be polled,
 * cancelled or finalized.
 *
 * Backends may override `compile_shader` and `specialize_shader`.
 */
class ShaderCompiler {
  /** Source text, one string per shader stage. */
  struct Sources {
    std::string vert;
    std::string geom;
    std::string frag;
    std::string comp;
  };

  /** State of one batch. A batch with a non-empty `specializations` is a specialization batch. */
  struct Batch {
    Vector<Shader *> shaders;
    Vector<const shader::ShaderCreateInfo *> infos;
    Vector<ShaderSpecialization> specializations;

    /** Number of compilations of this batch that have not completed yet. */
    std::atomic<int> pending_compilations = 0;
    std::atomic<bool> is_cancelled = false;

    bool is_specialization_batch() const
    {
      return !specializations.is_empty();
    }

    bool is_ready() const
    {
      /* Read the counter once so the assert and the result are based on the same value. */
      const int pending = pending_compilations.load();
      BLI_assert(pending >= 0);
      return pending == 0;
    }

    /** Free every non-null shader of the batch and empty the list. */
    void free_shaders()
    {
      for (Shader *shader : shaders) {
        if (shader) {
          GPU_shader_free(wrap(shader));
        }
      }
      shaders.clear();
    }
  };

  Map<BatchHandle, Batch *> batches_;
  std::mutex mutex_;
  std::condition_variable compilation_finished_notification_;

  /** One queued unit of work: a shader, addressed by its index inside a batch. */
  struct ParallelWork {
    Batch *batch = nullptr;
    int shader_index = 0;
  };

  std::deque<ParallelWork> compilation_queue_;
  std::unique_ptr<GPUWorker> compilation_worker_;

  bool support_specializations_;

  void run_thread();

  /** Handle value for the next batch. Starts at 1. */
  BatchHandle next_batch_handle_ = 1;

 protected:
  /* Must be called earlier from the destructor of the subclass if the compilation process relies
   * on subclass resources. */
  void destruct_compilation_worker()
  {
    compilation_worker_.reset();
  }

 public:
  ShaderCompiler(uint32_t threads_count = 1,
                 GPUWorker::ContextType context_type = GPUWorker::ContextType::PerThread,
                 bool support_specializations = false);
  virtual ~ShaderCompiler();

  Shader *compile(const shader::ShaderCreateInfo &info, bool is_batch_compilation);

  /** Backend hook that compiles a single shader from its create-info. */
  virtual Shader *compile_shader(const shader::ShaderCreateInfo &info);
  /** Backend hook for specializations. The default implementation does nothing. */
  virtual void specialize_shader(ShaderSpecialization & /*specialization*/) {}

  /* Batch API.
   * NOTE(review): `batch_cancel` and `batch_finalize` take the handle by reference, presumably
   * to reset it once the batch is released; confirm in the definitions. */
  BatchHandle batch_compile(Span<const shader::ShaderCreateInfo *> &infos);
  void batch_cancel(BatchHandle &handle);
  bool batch_is_ready(BatchHandle handle);
  Vector<Shader *> batch_finalize(BatchHandle &handle);

  SpecializationBatchHandle precompile_specializations(Span<ShaderSpecialization> specializations);
  bool specialization_batch_is_ready(SpecializationBatchHandle &handle);

  void wait_for_all();
};
/** Severity of a log item (see `GPULogItem::severity`). Values are spelled out explicitly. */
enum class Severity {
  Unknown = 0,
  Warning = 1,
  Error = 2,
  Note = 3,
};
/**
 * Position information attached to a log item.
 * All integer fields default to -1 and the string reference defaults to empty.
 * NOTE(review): -1 presumably means "not set"; confirm against the log parsers.
 */
struct LogCursor {
  int source{-1};
  int row{-1};
  int column{-1};
  StringRef file_name_and_error_line{};
};
/** One log entry: its cursor plus a severity, which defaults to `Severity::Unknown`. */
struct GPULogItem {
  LogCursor cursor;
  Severity severity{Severity::Unknown};
};
/**
 * Abstract interface for parsing compilation logs. Subclasses implement `parse_line`; the
 * protected helpers are shared scanning utilities for them.
 */
class GPULogParser {
 public:
  /* Polymorphic base: a virtual destructor makes destroying a derived parser through a
   * `GPULogParser *` well defined. */
  virtual ~GPULogParser() = default;

  /**
   * Parse one line of the log and fill `log_item`.
   * NOTE(review): the returned pointer is presumably the position in `log_line` after the parsed
   * prefix; confirm against the backend implementations.
   */
  virtual const char *parse_line(const char *source_combined,
                                 const char *log_line,
                                 GPULogItem &log_item) = 0;

 protected:
  /* Scanning helpers operating on a position inside the log line.
   * NOTE(review): the `skip_*` functions presumably return the advanced position and
   * `parse_number` writes the position after the number to `r_new_position`; confirm in the
   * definitions, which are not part of this header. */
  const char *skip_severity(const char *log_line,
                            GPULogItem &log_item,
                            const char *error_msg,
                            const char *warning_msg,
                            const char *note_msg) const;
  const char *skip_separators(const char *log_line, const StringRef separators) const;
  const char *skip_until(const char *log_line, char stop_char) const;
  bool at_number(const char *log_line) const;
  bool at_any(const char *log_line, const StringRef chars) const;
  int parse_number(const char *log_line, const char **r_new_position) const;

  MEM_CXX_CLASS_ALLOC_FUNCS("GPULogParser");
};
/* NOTE(review): only declared here. Presumably these two calls bracket a section during which
* shader-side printf output is captured for `ctx`; confirm against the definitions. */
void printf_begin(Context *ctx);
void printf_end(Context *ctx);
} // namespace blender::gpu
/* XXX: Do not use. Special hack to use OCIO with the batch API.
* Declared at global scope, outside of the `blender::gpu` namespace. */
GPUShader *immGetShader();