This repository has been archived on 2023-10-09. You can view files and clone it. You cannot open issues or pull requests or push a commit.
Files
blender-archive/source/blender/compositor/operations/COM_GaussianBlurBaseOperation.cc

140 lines
4.3 KiB
C++

/* SPDX-License-Identifier: GPL-2.0-or-later
* Copyright 2021 Blender Foundation. */
#include "COM_GaussianBlurBaseOperation.h"
namespace blender::compositor {
GaussianBlurBaseOperation::GaussianBlurBaseOperation(eDimension dim)
: BlurBaseOperation(DataType::Color)
{
gausstab_ = nullptr;
#ifdef BLI_HAVE_SSE2
gausstab_sse_ = nullptr;
#endif
filtersize_ = 0;
rad_ = 0.0f;
dimension_ = dim;
}
void GaussianBlurBaseOperation::init_data()
{
BlurBaseOperation::init_data();
if (execution_model_ == eExecutionModel::FullFrame) {
rad_ = max_ff(size_ * this->get_blur_size(dimension_), 0.0f);
rad_ = min_ff(rad_, MAX_GAUSSTAB_RADIUS);
filtersize_ = min_ii(ceil(rad_), MAX_GAUSSTAB_RADIUS);
}
}
void GaussianBlurBaseOperation::init_execution()
{
BlurBaseOperation::init_execution();
if (execution_model_ == eExecutionModel::FullFrame) {
gausstab_ = BlurBaseOperation::make_gausstab(rad_, filtersize_);
#ifdef BLI_HAVE_SSE2
gausstab_sse_ = BlurBaseOperation::convert_gausstab_sse(gausstab_, filtersize_);
#endif
}
}
void GaussianBlurBaseOperation::deinit_execution()
{
BlurBaseOperation::deinit_execution();
if (gausstab_) {
MEM_freeN(gausstab_);
gausstab_ = nullptr;
}
#ifdef BLI_HAVE_SSE2
if (gausstab_sse_) {
MEM_freeN(gausstab_sse_);
gausstab_sse_ = nullptr;
}
#endif
}
void GaussianBlurBaseOperation::get_area_of_interest(const int input_idx,
const rcti &output_area,
rcti &r_input_area)
{
if (input_idx != IMAGE_INPUT_INDEX) {
BlurBaseOperation::get_area_of_interest(input_idx, output_area, r_input_area);
return;
}
r_input_area = output_area;
switch (dimension_) {
case eDimension::X:
r_input_area.xmin = output_area.xmin - filtersize_ - 1;
r_input_area.xmax = output_area.xmax + filtersize_ + 1;
break;
case eDimension::Y:
r_input_area.ymin = output_area.ymin - filtersize_ - 1;
r_input_area.ymax = output_area.ymax + filtersize_ + 1;
break;
}
}
void GaussianBlurBaseOperation::update_memory_buffer_partial(MemoryBuffer *output,
const rcti &area,
Span<MemoryBuffer *> inputs)
{
MemoryBuffer *input = inputs[IMAGE_INPUT_INDEX];
const rcti &input_rect = input->get_rect();
BuffersIterator<float> it = output->iterate_with({input}, area);
int min_input_coord = -1;
int max_input_coord = -1;
int elem_stride = -1;
std::function<int()> get_current_coord;
switch (dimension_) {
case eDimension::X:
min_input_coord = input_rect.xmin;
max_input_coord = input_rect.xmax;
elem_stride = input->elem_stride;
get_current_coord = [&] { return it.x; };
break;
case eDimension::Y:
min_input_coord = input_rect.ymin;
max_input_coord = input_rect.ymax;
elem_stride = input->row_stride;
get_current_coord = [&] { return it.y; };
break;
}
for (; !it.is_end(); ++it) {
const int coord = get_current_coord();
const int coord_min = max_ii(coord - filtersize_, min_input_coord);
const int coord_max = min_ii(coord + filtersize_ + 1, max_input_coord);
float ATTR_ALIGN(16) color_accum[4] = {0.0f, 0.0f, 0.0f, 0.0f};
float multiplier_accum = 0.0f;
const int step = QualityStepHelper::get_step();
const float *in = it.in(0) + (intptr_t(coord_min) - coord) * elem_stride;
const int in_stride = elem_stride * step;
int gauss_idx = (coord_min - coord) + filtersize_;
const int gauss_end = gauss_idx + (coord_max - coord_min);
#ifdef BLI_HAVE_SSE2
__m128 accum_r = _mm_load_ps(color_accum);
for (; gauss_idx < gauss_end; in += in_stride, gauss_idx += step) {
__m128 reg_a = _mm_load_ps(in);
reg_a = _mm_mul_ps(reg_a, gausstab_sse_[gauss_idx]);
accum_r = _mm_add_ps(accum_r, reg_a);
multiplier_accum += gausstab_[gauss_idx];
}
_mm_store_ps(color_accum, accum_r);
#else
for (; gauss_idx < gauss_end; in += in_stride, gauss_idx += step) {
const float multiplier = gausstab_[gauss_idx];
madd_v4_v4fl(color_accum, in, multiplier);
multiplier_accum += multiplier;
}
#endif
mul_v4_v4fl(it.out, color_accum, 1.0f / multiplier_accum);
}
}
} // namespace blender::compositor