This patch adds new arg-type parameters to `DeviceQueue::enqueue` and its overrides. This is in preparation for the Metal backend which needs this information for correct argument encoding. Ref T92212 Reviewed By: brecht Maniphest Tasks: T92212 Differential Revision: https://developer.blender.org/D13357
122 lines
4.4 KiB
C++
122 lines
4.4 KiB
C++
/*
|
|
* Copyright 2011-2021 Blender Foundation
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include "integrator/pass_accessor_gpu.h"
|
|
|
|
#include "device/queue.h"
|
|
#include "session/buffers.h"
|
|
#include "util/log.h"
|
|
|
|
CCL_NAMESPACE_BEGIN
|
|
|
|
PassAccessorGPU::PassAccessorGPU(DeviceQueue *queue,
|
|
const PassAccessInfo &pass_access_info,
|
|
float exposure,
|
|
int num_samples)
|
|
: PassAccessor(pass_access_info, exposure, num_samples), queue_(queue)
|
|
|
|
{
|
|
}
|
|
|
|
/* --------------------------------------------------------------------
|
|
* Kernel execution.
|
|
*/
|
|
|
|
void PassAccessorGPU::run_film_convert_kernels(DeviceKernel kernel,
|
|
const RenderBuffers *render_buffers,
|
|
const BufferParams &buffer_params,
|
|
const Destination &destination) const
|
|
{
|
|
KernelFilmConvert kfilm_convert;
|
|
init_kernel_film_convert(&kfilm_convert, buffer_params, destination);
|
|
|
|
const int work_size = buffer_params.window_width * buffer_params.window_height;
|
|
|
|
const int destination_stride = destination.stride != 0 ? destination.stride :
|
|
buffer_params.window_width;
|
|
|
|
const int offset = buffer_params.window_x * buffer_params.pass_stride +
|
|
buffer_params.window_y * buffer_params.stride * buffer_params.pass_stride;
|
|
|
|
if (destination.d_pixels) {
|
|
DCHECK_EQ(destination.stride, 0) << "Custom stride for float destination is not implemented.";
|
|
|
|
DeviceKernelArguments args(&kfilm_convert,
|
|
&destination.d_pixels,
|
|
&render_buffers->buffer.device_pointer,
|
|
&work_size,
|
|
&buffer_params.window_width,
|
|
&offset,
|
|
&buffer_params.stride,
|
|
&destination.offset,
|
|
&destination_stride);
|
|
|
|
queue_->enqueue(kernel, work_size, args);
|
|
}
|
|
if (destination.d_pixels_half_rgba) {
|
|
const DeviceKernel kernel_half_float = static_cast<DeviceKernel>(kernel + 1);
|
|
|
|
DeviceKernelArguments args(&kfilm_convert,
|
|
&destination.d_pixels_half_rgba,
|
|
&render_buffers->buffer.device_pointer,
|
|
&work_size,
|
|
&buffer_params.window_width,
|
|
&offset,
|
|
&buffer_params.stride,
|
|
&destination.offset,
|
|
&destination_stride);
|
|
|
|
queue_->enqueue(kernel_half_float, work_size, args);
|
|
}
|
|
|
|
queue_->synchronize();
|
|
}
|
|
|
|
/* --------------------------------------------------------------------
|
|
* Pass accessors.
|
|
*/
|
|
|
|
#define DEFINE_PASS_ACCESSOR(pass, kernel_pass) \
|
|
void PassAccessorGPU::get_pass_##pass(const RenderBuffers *render_buffers, \
|
|
const BufferParams &buffer_params, \
|
|
const Destination &destination) const \
|
|
{ \
|
|
run_film_convert_kernels( \
|
|
DEVICE_KERNEL_FILM_CONVERT_##kernel_pass, render_buffers, buffer_params, destination); \
|
|
}
|
|
|
|
/* Float (scalar) passes. */
|
|
DEFINE_PASS_ACCESSOR(depth, DEPTH);
|
|
DEFINE_PASS_ACCESSOR(mist, MIST);
|
|
DEFINE_PASS_ACCESSOR(sample_count, SAMPLE_COUNT);
|
|
DEFINE_PASS_ACCESSOR(float, FLOAT);
|
|
|
|
/* Float3 passes. */
|
|
DEFINE_PASS_ACCESSOR(light_path, LIGHT_PATH);
|
|
DEFINE_PASS_ACCESSOR(float3, FLOAT3);
|
|
|
|
/* Float4 passes. */
|
|
DEFINE_PASS_ACCESSOR(motion, MOTION);
|
|
DEFINE_PASS_ACCESSOR(cryptomatte, CRYPTOMATTE);
|
|
DEFINE_PASS_ACCESSOR(shadow_catcher, SHADOW_CATCHER);
|
|
DEFINE_PASS_ACCESSOR(shadow_catcher_matte_with_shadow, SHADOW_CATCHER_MATTE_WITH_SHADOW);
|
|
DEFINE_PASS_ACCESSOR(combined, COMBINED);
|
|
DEFINE_PASS_ACCESSOR(float4, FLOAT4);
|
|
|
|
#undef DEFINE_PASS_ACCESSOR
|
|
|
|
CCL_NAMESPACE_END
|