2015-12-30 17:54:02 +05:00
|
|
|
/*
|
|
|
|
|
* Copyright 2011-2013 Blender Foundation
|
|
|
|
|
*
|
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
|
*
|
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
*
|
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
|
* limitations under the License.
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/* Templated common implementation part of all CPU kernels.
|
|
|
|
|
*
|
|
|
|
|
* The idea is that each particular .cpp file sets the needed optimization flags and
|
|
|
|
|
* simply includes this file without having to copy the actual implementation over.
|
|
|
|
|
*/
|
|
|
|
|
|
2020-03-06 14:15:21 +01:00
|
|
|
// clang-format off
|
Cycles: Make all #include statements relative to cycles source directory
The idea is to make include statements more explicit and obvious where the
file is coming from, additionally reducing chance of wrong header being
picked up.
For example, it was not obvious whether bvh.h was referring to builder
or traversal, whether node.h is a generic graph node or a shader node
and cases like that.
Surely this might look obvious for the active developers, but after some
time of not touching the code it becomes less obvious where file is coming
from.
This was briefly mentioned in T50824 and seems @brecht is fine with such
explicitness, but need to agree with all active developers before committing
this.
Please note that this patch is lacking changes related to GPU/OpenCL
support. This will be solved if/when we all agree this is a good idea to move
forward.
Reviewers: brecht, lukasstockner97, maiself, nirved, dingto, juicyfruit, swerner
Reviewed By: lukasstockner97, maiself, nirved, dingto
Subscribers: brecht
Differential Revision: https://developer.blender.org/D2586
2017-03-28 20:39:14 +02:00
|
|
|
#include "kernel/kernel_compat_cpu.h"
|
2017-02-14 06:20:48 -05:00
|
|
|
|
2017-05-16 15:59:57 -04:00
|
|
|
#ifndef KERNEL_STUB
|
|
|
|
|
# ifndef __SPLIT_KERNEL__
|
|
|
|
|
# include "kernel/kernel_math.h"
|
|
|
|
|
# include "kernel/kernel_types.h"
|
|
|
|
|
|
|
|
|
|
# include "kernel/split/kernel_split_data.h"
|
|
|
|
|
# include "kernel/kernel_globals.h"
|
|
|
|
|
|
2018-06-14 17:48:19 +02:00
|
|
|
# include "kernel/kernel_color.h"
|
2017-05-16 15:59:57 -04:00
|
|
|
# include "kernel/kernels/cpu/kernel_cpu_image.h"
|
|
|
|
|
# include "kernel/kernel_film.h"
|
|
|
|
|
# include "kernel/kernel_path.h"
|
|
|
|
|
# include "kernel/kernel_path_branched.h"
|
|
|
|
|
# include "kernel/kernel_bake.h"
|
|
|
|
|
# else
|
|
|
|
|
# include "kernel/split/kernel_split_common.h"
|
|
|
|
|
|
|
|
|
|
# include "kernel/split/kernel_data_init.h"
|
|
|
|
|
# include "kernel/split/kernel_path_init.h"
|
|
|
|
|
# include "kernel/split/kernel_scene_intersect.h"
|
|
|
|
|
# include "kernel/split/kernel_lamp_emission.h"
|
|
|
|
|
# include "kernel/split/kernel_do_volume.h"
|
|
|
|
|
# include "kernel/split/kernel_queue_enqueue.h"
|
|
|
|
|
# include "kernel/split/kernel_indirect_background.h"
|
|
|
|
|
# include "kernel/split/kernel_shader_setup.h"
|
|
|
|
|
# include "kernel/split/kernel_shader_sort.h"
|
|
|
|
|
# include "kernel/split/kernel_shader_eval.h"
|
|
|
|
|
# include "kernel/split/kernel_holdout_emission_blurring_pathtermination_ao.h"
|
|
|
|
|
# include "kernel/split/kernel_subsurface_scatter.h"
|
|
|
|
|
# include "kernel/split/kernel_direct_lighting.h"
|
|
|
|
|
# include "kernel/split/kernel_shadow_blocked_ao.h"
|
|
|
|
|
# include "kernel/split/kernel_shadow_blocked_dl.h"
|
2017-05-29 20:40:26 -04:00
|
|
|
# include "kernel/split/kernel_enqueue_inactive.h"
|
2017-05-16 15:59:57 -04:00
|
|
|
# include "kernel/split/kernel_next_iteration_setup.h"
|
|
|
|
|
# include "kernel/split/kernel_indirect_subsurface.h"
|
|
|
|
|
# include "kernel/split/kernel_buffer_update.h"
|
2020-03-05 12:05:42 +01:00
|
|
|
# include "kernel/split/kernel_adaptive_stopping.h"
|
|
|
|
|
# include "kernel/split/kernel_adaptive_filter_x.h"
|
|
|
|
|
# include "kernel/split/kernel_adaptive_filter_y.h"
|
|
|
|
|
# include "kernel/split/kernel_adaptive_adjust_samples.h"
|
2017-05-16 15:59:57 -04:00
|
|
|
# endif /* __SPLIT_KERNEL__ */
|
2017-02-14 06:20:48 -05:00
|
|
|
#else
|
2017-05-07 14:40:58 +02:00
|
|
|
/* Build the message reported when a stubbed kernel entry point is called.
 *
 * `arch` is stringified here, one macro level below STUB_ASSERT, so that a
 * macro passed as the architecture (KERNEL_ARCH) has already been replaced by
 * its value when `#arch` is applied. Stringifying it directly in STUB_ASSERT
 * would always yield the literal text "KERNEL_ARCH".
 *
 * `name_string` must already be a string literal.
 *
 * This helper is not #undef'ed with STUB_ASSERT; re-including this file
 * redefines it with identical tokens, which the preprocessor allows. */
#  define STUB_ASSERT_MESSAGE(arch, name_string) \
    name_string " kernel stub for architecture " #arch " was called!"

/* Fail an assertion naming the kernel and the architecture it was stubbed for.
 *
 * The operand of assert() is the negation of a string literal, which is always
 * false, so the assertion always fires when assertions are enabled and the
 * message text appears in the diagnostic. `name` is stringified as written. */
#  define STUB_ASSERT(arch, name) assert(!(STUB_ASSERT_MESSAGE(arch, #name)))
|
2017-05-16 15:59:57 -04:00
|
|
|
|
|
|
|
|
# ifdef __SPLIT_KERNEL__
|
|
|
|
|
# include "kernel/split/kernel_data_init.h"
|
|
|
|
|
# endif /* __SPLIT_KERNEL__ */
|
|
|
|
|
#endif /* KERNEL_STUB */
|
2020-03-06 14:15:21 +01:00
|
|
|
// clang-format on
|
2017-05-07 14:40:58 +02:00
|
|
|
|
2015-12-30 17:54:02 +05:00
|
|
|
CCL_NAMESPACE_BEGIN
|
|
|
|
|
|
2017-02-14 06:20:48 -05:00
|
|
|
#ifndef __SPLIT_KERNEL__
|
|
|
|
|
|
2015-12-30 17:54:02 +05:00
|
|
|
/* Path Tracing */
|
|
|
|
|
|
|
|
|
|
/* Path tracing entry point for the architecture this file is compiled for.
 *
 * In stub builds (KERNEL_STUB) the function only asserts. Otherwise every
 * argument is forwarded unchanged: to kernel_branched_path_trace() when
 * __BRANCHED_PATH__ is compiled in and kernel_data.integrator.branched is set,
 * and to kernel_path_trace() in all remaining cases. */
void KERNEL_FUNCTION_FULL_NAME(path_trace)(
    KernelGlobals *kg, float *buffer, int sample, int x, int y, int offset, int stride)
{
#  ifndef KERNEL_STUB
#    ifdef __BRANCHED_PATH__
  /* Branched integrator selected: handle it and leave early. */
  if (kernel_data.integrator.branched) {
    kernel_branched_path_trace(kg, buffer, sample, x, y, offset, stride);
    return;
  }
#    endif
  kernel_path_trace(kg, buffer, sample, x, y, offset, stride);
#  else
  STUB_ASSERT(KERNEL_ARCH, path_trace);
#  endif /* !KERNEL_STUB */
}
|
|
|
|
|
|
|
|
|
|
/* Film */
|
|
|
|
|
|
|
|
|
|
/* Film conversion entry point: forwards all arguments unchanged to
 * kernel_film_convert_to_byte(). Stub builds (KERNEL_STUB) assert instead. */
void KERNEL_FUNCTION_FULL_NAME(convert_to_byte)(KernelGlobals *kg,
                                                uchar4 *rgba,
                                                float *buffer,
                                                float sample_scale,
                                                int x,
                                                int y,
                                                int offset,
                                                int stride)
{
#  ifndef KERNEL_STUB
  kernel_film_convert_to_byte(kg, rgba, buffer, sample_scale, x, y, offset, stride);
#  else
  STUB_ASSERT(KERNEL_ARCH, convert_to_byte);
#  endif /* !KERNEL_STUB */
}
|
|
|
|
|
|
|
|
|
|
/* Film conversion entry point: forwards all arguments unchanged to
 * kernel_film_convert_to_half_float(). Stub builds (KERNEL_STUB) assert
 * instead. */
void KERNEL_FUNCTION_FULL_NAME(convert_to_half_float)(KernelGlobals *kg,
                                                      uchar4 *rgba,
                                                      float *buffer,
                                                      float sample_scale,
                                                      int x,
                                                      int y,
                                                      int offset,
                                                      int stride)
{
#  ifndef KERNEL_STUB
  kernel_film_convert_to_half_float(kg, rgba, buffer, sample_scale, x, y, offset, stride);
#  else
  STUB_ASSERT(KERNEL_ARCH, convert_to_half_float);
#  endif /* !KERNEL_STUB */
}
|
|
|
|
|
|
Cycles: code refactor to bake using regular render session and tiles
There should be no user visible change from this, except that tile size
now affects performance. The goal here is to simplify bake denoising in
D3099, letting it reuse more denoising tiles and pass code.
A lot of code is now shared with regular rendering, with the two main
differences being that we read some render result passes from the bake API
when starting to render a tile, and call the bake kernel instead of the
path trace kernel.
With this kind of design where Cycles asks for tiles from the bake API,
it should eventually be easier to reduce memory usage, show tiles as
they are baked, or bake multiple passes at once, though there's still
quite some work needed for that.
Reviewers: #cycles
Subscribers: monio, wmatyjewicz, lukasstockner97, michaelknubben
Differential Revision: https://developer.blender.org/D3108
2019-05-10 21:39:58 +02:00
|
|
|
/* Bake */
|
|
|
|
|
|
|
|
|
|
/* Bake entry point.
 *
 * Stub builds (KERNEL_STUB) assert. Otherwise, when __BAKING__ is defined, all
 * arguments are forwarded unchanged to kernel_bake_evaluate(). With neither
 * macro defined the function body is empty. */
void KERNEL_FUNCTION_FULL_NAME(bake)(
    KernelGlobals *kg, float *buffer, int sample, int x, int y, int offset, int stride)
{
#  if defined(KERNEL_STUB)
  STUB_ASSERT(KERNEL_ARCH, bake);
#  elif defined(__BAKING__)
  kernel_bake_evaluate(kg, buffer, sample, x, y, offset, stride);
#  endif
}
|
|
|
|
|
|
2015-12-30 17:54:02 +05:00
|
|
|
/* Shader Evaluate */
|
|
|
|
|
|
|
|
|
|
/* Shader evaluation entry point.
 *
 * Dispatches on `type`: SHADER_EVAL_DISPLACE goes to
 * kernel_displace_evaluate(), every other value goes to
 * kernel_background_evaluate(). Both receive (kg, input, output, i).
 * The `filter`, `offset` and `sample` parameters are accepted but not read by
 * this implementation. Stub builds (KERNEL_STUB) assert instead. */
void KERNEL_FUNCTION_FULL_NAME(shader)(KernelGlobals *kg,
                                       uint4 *input,
                                       float4 *output,
                                       int type,
                                       int filter,
                                       int i,
                                       int offset,
                                       int sample)
{
#  ifndef KERNEL_STUB
  if (type != SHADER_EVAL_DISPLACE) {
    kernel_background_evaluate(kg, input, output, i);
    return;
  }

  kernel_displace_evaluate(kg, input, output, i);
#  else
  STUB_ASSERT(KERNEL_ARCH, shader);
#  endif /* !KERNEL_STUB */
}
|
|
|
|
|
|
2017-02-14 06:20:48 -05:00
|
|
|
#else /* __SPLIT_KERNEL__ */
|
|
|
|
|
|
|
|
|
|
/* Split Kernel Path Tracing */
|
|
|
|
|
|
2017-05-07 14:40:58 +02:00
|
|
|
/* Generators for the split kernel entry points.
 *
 * Each macro defines a function KERNEL_FUNCTION_FULL_NAME(name) taking
 * (KernelGlobals *kg, KernelData *); the second parameter is unnamed and
 * unused in every variant.
 *
 * - DEFINE_SPLIT_KERNEL_FUNCTION(name) calls kernel_<name>(kg).
 * - DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(name, type) declares a `ccl_local type`
 *   object and calls kernel_<name>(kg, &locals).
 *
 * In stub builds (KERNEL_STUB) both variants only assert, and `type` is
 * ignored. */
#  ifndef KERNEL_STUB

#    define DEFINE_SPLIT_KERNEL_FUNCTION(name) \
      void KERNEL_FUNCTION_FULL_NAME(name)(KernelGlobals * kg, KernelData * /*data*/) \
      { \
        kernel_##name(kg); \
      }

#    define DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(name, type) \
      void KERNEL_FUNCTION_FULL_NAME(name)(KernelGlobals * kg, KernelData * /*data*/) \
      { \
        ccl_local type locals; \
        kernel_##name(kg, &locals); \
      }

#  else /* KERNEL_STUB */

#    define DEFINE_SPLIT_KERNEL_FUNCTION(name) \
      void KERNEL_FUNCTION_FULL_NAME(name)(KernelGlobals * kg, KernelData * /*data*/) \
      { \
        STUB_ASSERT(KERNEL_ARCH, name); \
      }

#    define DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(name, type) \
      void KERNEL_FUNCTION_FULL_NAME(name)(KernelGlobals * kg, KernelData * /*data*/) \
      { \
        STUB_ASSERT(KERNEL_ARCH, name); \
      }

#  endif /* KERNEL_STUB */
|
2017-03-08 13:34:29 +01:00
|
|
|
|
2017-03-01 01:05:55 -05:00
|
|
|
/* Instantiate one entry point per split kernel. The _LOCALS form is used for
 * kernels whose kernel_<name>() function takes a second argument; its type is
 * given as the macro's second parameter. */
DEFINE_SPLIT_KERNEL_FUNCTION(path_init)
DEFINE_SPLIT_KERNEL_FUNCTION(scene_intersect)
DEFINE_SPLIT_KERNEL_FUNCTION(lamp_emission)
DEFINE_SPLIT_KERNEL_FUNCTION(do_volume)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(queue_enqueue, QueueEnqueueLocals)
DEFINE_SPLIT_KERNEL_FUNCTION(indirect_background)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(shader_setup, uint)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(shader_sort, ShaderSortLocals)
DEFINE_SPLIT_KERNEL_FUNCTION(shader_eval)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(holdout_emission_blurring_pathtermination_ao,
                                    BackgroundAOLocals)
DEFINE_SPLIT_KERNEL_FUNCTION(subsurface_scatter)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(direct_lighting, uint)
DEFINE_SPLIT_KERNEL_FUNCTION(shadow_blocked_ao)
DEFINE_SPLIT_KERNEL_FUNCTION(shadow_blocked_dl)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(enqueue_inactive, uint)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(next_iteration_setup, uint)
DEFINE_SPLIT_KERNEL_FUNCTION(indirect_subsurface)
DEFINE_SPLIT_KERNEL_FUNCTION_LOCALS(buffer_update, uint)
DEFINE_SPLIT_KERNEL_FUNCTION(adaptive_stopping)
DEFINE_SPLIT_KERNEL_FUNCTION(adaptive_filter_x)
DEFINE_SPLIT_KERNEL_FUNCTION(adaptive_filter_y)
DEFINE_SPLIT_KERNEL_FUNCTION(adaptive_adjust_samples)
|
2017-02-14 06:20:48 -05:00
|
|
|
#endif /* __SPLIT_KERNEL__ */
|
|
|
|
|
|
2017-05-07 14:40:58 +02:00
|
|
|
#undef KERNEL_STUB
|
|
|
|
|
#undef STUB_ASSERT
|
|
|
|
|
#undef KERNEL_ARCH
|
|
|
|
|
|
2015-12-30 17:54:02 +05:00
|
|
|
CCL_NAMESPACE_END
|