Listing the "Blender Foundation" as copyright holder implied the Blender Foundation holds copyright to files which may include work from many developers. While keeping copyright on headers makes sense for isolated libraries, Blender's own code may be refactored or moved between files in a way that makes the per file copyright holders less meaningful. Copyright references to the "Blender Foundation" have been replaced with "Blender Authors", with the exception of `./extern/` since these this contains libraries which are more isolated, any changed to license headers there can be handled on a case-by-case basis. Some directories in `./intern/` have also been excluded: - `./intern/cycles/` it's own `AUTHORS` file is planned. - `./intern/opensubdiv/`. An "AUTHORS" file has been added, using the chromium projects authors file as a template. Design task: #110784 Ref !110783.
141 lines
4.3 KiB
C++
141 lines
4.3 KiB
C++
/* SPDX-FileCopyrightText: 2021 Blender Authors
|
|
*
|
|
* SPDX-License-Identifier: GPL-2.0-or-later */
|
|
|
|
#include "COM_GaussianBlurBaseOperation.h"
|
|
|
|
namespace blender::compositor {
|
|
|
|
GaussianBlurBaseOperation::GaussianBlurBaseOperation(eDimension dim)
|
|
: BlurBaseOperation(DataType::Color)
|
|
{
|
|
gausstab_ = nullptr;
|
|
#if BLI_HAVE_SSE2
|
|
gausstab_sse_ = nullptr;
|
|
#endif
|
|
filtersize_ = 0;
|
|
rad_ = 0.0f;
|
|
dimension_ = dim;
|
|
}
|
|
|
|
void GaussianBlurBaseOperation::init_data()
|
|
{
|
|
BlurBaseOperation::init_data();
|
|
if (execution_model_ == eExecutionModel::FullFrame) {
|
|
rad_ = max_ff(size_ * this->get_blur_size(dimension_), 0.0f);
|
|
rad_ = min_ff(rad_, MAX_GAUSSTAB_RADIUS);
|
|
filtersize_ = min_ii(ceil(rad_), MAX_GAUSSTAB_RADIUS);
|
|
}
|
|
}
|
|
|
|
void GaussianBlurBaseOperation::init_execution()
|
|
{
|
|
BlurBaseOperation::init_execution();
|
|
if (execution_model_ == eExecutionModel::FullFrame) {
|
|
gausstab_ = BlurBaseOperation::make_gausstab(rad_, filtersize_);
|
|
#if BLI_HAVE_SSE2
|
|
gausstab_sse_ = BlurBaseOperation::convert_gausstab_sse(gausstab_, filtersize_);
|
|
#endif
|
|
}
|
|
}
|
|
|
|
void GaussianBlurBaseOperation::deinit_execution()
|
|
{
|
|
BlurBaseOperation::deinit_execution();
|
|
|
|
if (gausstab_) {
|
|
MEM_freeN(gausstab_);
|
|
gausstab_ = nullptr;
|
|
}
|
|
#if BLI_HAVE_SSE2
|
|
if (gausstab_sse_) {
|
|
MEM_freeN(gausstab_sse_);
|
|
gausstab_sse_ = nullptr;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
void GaussianBlurBaseOperation::get_area_of_interest(const int input_idx,
|
|
const rcti &output_area,
|
|
rcti &r_input_area)
|
|
{
|
|
if (input_idx != IMAGE_INPUT_INDEX) {
|
|
BlurBaseOperation::get_area_of_interest(input_idx, output_area, r_input_area);
|
|
return;
|
|
}
|
|
|
|
r_input_area = output_area;
|
|
switch (dimension_) {
|
|
case eDimension::X:
|
|
r_input_area.xmin = output_area.xmin - filtersize_ - 1;
|
|
r_input_area.xmax = output_area.xmax + filtersize_ + 1;
|
|
break;
|
|
case eDimension::Y:
|
|
r_input_area.ymin = output_area.ymin - filtersize_ - 1;
|
|
r_input_area.ymax = output_area.ymax + filtersize_ + 1;
|
|
break;
|
|
}
|
|
}
|
|
|
|
void GaussianBlurBaseOperation::update_memory_buffer_partial(MemoryBuffer *output,
|
|
const rcti &area,
|
|
Span<MemoryBuffer *> inputs)
|
|
{
|
|
MemoryBuffer *input = inputs[IMAGE_INPUT_INDEX];
|
|
const rcti &input_rect = input->get_rect();
|
|
BuffersIterator<float> it = output->iterate_with({input}, area);
|
|
|
|
int min_input_coord = -1;
|
|
int max_input_coord = -1;
|
|
int elem_stride = -1;
|
|
std::function<int()> get_current_coord;
|
|
switch (dimension_) {
|
|
case eDimension::X:
|
|
min_input_coord = input_rect.xmin;
|
|
max_input_coord = input_rect.xmax;
|
|
elem_stride = input->elem_stride;
|
|
get_current_coord = [&] { return it.x; };
|
|
break;
|
|
case eDimension::Y:
|
|
min_input_coord = input_rect.ymin;
|
|
max_input_coord = input_rect.ymax;
|
|
elem_stride = input->row_stride;
|
|
get_current_coord = [&] { return it.y; };
|
|
break;
|
|
}
|
|
|
|
for (; !it.is_end(); ++it) {
|
|
const int coord = get_current_coord();
|
|
const int coord_min = max_ii(coord - filtersize_, min_input_coord);
|
|
const int coord_max = min_ii(coord + filtersize_ + 1, max_input_coord);
|
|
|
|
float ATTR_ALIGN(16) color_accum[4] = {0.0f, 0.0f, 0.0f, 0.0f};
|
|
float multiplier_accum = 0.0f;
|
|
|
|
const int step = QualityStepHelper::get_step();
|
|
const float *in = it.in(0) + (intptr_t(coord_min) - coord) * elem_stride;
|
|
const int in_stride = elem_stride * step;
|
|
int gauss_idx = (coord_min - coord) + filtersize_;
|
|
const int gauss_end = gauss_idx + (coord_max - coord_min);
|
|
#if BLI_HAVE_SSE2
|
|
__m128 accum_r = _mm_load_ps(color_accum);
|
|
for (; gauss_idx < gauss_end; in += in_stride, gauss_idx += step) {
|
|
__m128 reg_a = _mm_load_ps(in);
|
|
reg_a = _mm_mul_ps(reg_a, gausstab_sse_[gauss_idx]);
|
|
accum_r = _mm_add_ps(accum_r, reg_a);
|
|
multiplier_accum += gausstab_[gauss_idx];
|
|
}
|
|
_mm_store_ps(color_accum, accum_r);
|
|
#else
|
|
for (; gauss_idx < gauss_end; in += in_stride, gauss_idx += step) {
|
|
const float multiplier = gausstab_[gauss_idx];
|
|
madd_v4_v4fl(color_accum, in, multiplier);
|
|
multiplier_accum += multiplier;
|
|
}
|
|
#endif
|
|
mul_v4_v4fl(it.out, color_accum, 1.0f / multiplier_accum);
|
|
}
|
|
}
|
|
|
|
} // namespace blender::compositor
|