/* * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software Foundation, * Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. * * Copyright 2011, Blender Foundation. */ #include "COM_VariableSizeBokehBlurOperation.h" #include "BLI_math.h" #include "COM_ExecutionSystem.h" #include "COM_OpenCLDevice.h" #include "RE_pipeline.h" namespace blender::compositor { VariableSizeBokehBlurOperation::VariableSizeBokehBlurOperation() { this->addInputSocket(DataType::Color); this->addInputSocket(DataType::Color, ResizeMode::None); /* Do not resize the bokeh image. */ this->addInputSocket(DataType::Value); /* Radius. */ #ifdef COM_DEFOCUS_SEARCH /* Inverse search radius optimization structure. */ this->addInputSocket(DataType::Color, ResizeMode::None); #endif this->addOutputSocket(DataType::Color); flags.complex = true; flags.open_cl = true; this->m_inputProgram = nullptr; this->m_inputBokehProgram = nullptr; this->m_inputSizeProgram = nullptr; this->m_maxBlur = 32.0f; this->m_threshold = 1.0f; this->m_do_size_scale = false; #ifdef COM_DEFOCUS_SEARCH this->m_inputSearchProgram = nullptr; #endif } void VariableSizeBokehBlurOperation::initExecution() { this->m_inputProgram = getInputSocketReader(0); this->m_inputBokehProgram = getInputSocketReader(1); this->m_inputSizeProgram = getInputSocketReader(2); #ifdef COM_DEFOCUS_SEARCH this->m_inputSearchProgram = getInputSocketReader(3); #endif QualityStepHelper::initExecution(COM_QH_INCREASE); } struct VariableSizeBokehBlurTileData { MemoryBuffer *color; MemoryBuffer *bokeh; MemoryBuffer *size; int maxBlurScalar; }; void *VariableSizeBokehBlurOperation::initializeTileData(rcti *rect) { VariableSizeBokehBlurTileData *data = new VariableSizeBokehBlurTileData(); data->color = (MemoryBuffer *)this->m_inputProgram->initializeTileData(rect); data->bokeh = (MemoryBuffer *)this->m_inputBokehProgram->initializeTileData(rect); data->size = (MemoryBuffer *)this->m_inputSizeProgram->initializeTileData(rect); rcti rect2; this->determineDependingAreaOfInterest( rect, (ReadBufferOperation *)this->m_inputSizeProgram, &rect2); const float max_dim = MAX2(this->getWidth(), this->getHeight()); const float scalar = this->m_do_size_scale ? (max_dim / 100.0f) : 1.0f; data->maxBlurScalar = (int)(data->size->get_max_value(rect2) * scalar); CLAMP(data->maxBlurScalar, 1.0f, this->m_maxBlur); return data; } void VariableSizeBokehBlurOperation::deinitializeTileData(rcti * /*rect*/, void *data) { VariableSizeBokehBlurTileData *result = (VariableSizeBokehBlurTileData *)data; delete result; } void VariableSizeBokehBlurOperation::executePixel(float output[4], int x, int y, void *data) { VariableSizeBokehBlurTileData *tileData = (VariableSizeBokehBlurTileData *)data; MemoryBuffer *inputProgramBuffer = tileData->color; MemoryBuffer *inputBokehBuffer = tileData->bokeh; MemoryBuffer *inputSizeBuffer = tileData->size; float *inputSizeFloatBuffer = inputSizeBuffer->getBuffer(); float *inputProgramFloatBuffer = inputProgramBuffer->getBuffer(); float readColor[4]; float bokeh[4]; float tempSize[4]; float multiplier_accum[4]; float color_accum[4]; const float max_dim = MAX2(getWidth(), getHeight()); const float scalar = this->m_do_size_scale ? (max_dim / 100.0f) : 1.0f; int maxBlurScalar = tileData->maxBlurScalar; BLI_assert(inputBokehBuffer->getWidth() == COM_BLUR_BOKEH_PIXELS); BLI_assert(inputBokehBuffer->getHeight() == COM_BLUR_BOKEH_PIXELS); #ifdef COM_DEFOCUS_SEARCH float search[4]; this->m_inputSearchProgram->read(search, x / InverseSearchRadiusOperation::DIVIDER, y / InverseSearchRadiusOperation::DIVIDER, nullptr); int minx = search[0]; int miny = search[1]; int maxx = search[2]; int maxy = search[3]; #else int minx = MAX2(x - maxBlurScalar, 0); int miny = MAX2(y - maxBlurScalar, 0); int maxx = MIN2(x + maxBlurScalar, (int)getWidth()); int maxy = MIN2(y + maxBlurScalar, (int)getHeight()); #endif { inputSizeBuffer->readNoCheck(tempSize, x, y); inputProgramBuffer->readNoCheck(readColor, x, y); copy_v4_v4(color_accum, readColor); copy_v4_fl(multiplier_accum, 1.0f); float size_center = tempSize[0] * scalar; const int addXStepValue = QualityStepHelper::getStep(); const int addYStepValue = addXStepValue; const int addXStepColor = addXStepValue * COM_DATA_TYPE_COLOR_CHANNELS; if (size_center > this->m_threshold) { for (int ny = miny; ny < maxy; ny += addYStepValue) { float dy = ny - y; int offsetValueNy = ny * inputSizeBuffer->getWidth(); int offsetValueNxNy = offsetValueNy + (minx); int offsetColorNxNy = offsetValueNxNy * COM_DATA_TYPE_COLOR_CHANNELS; for (int nx = minx; nx < maxx; nx += addXStepValue) { if (nx != x || ny != y) { float size = MIN2(inputSizeFloatBuffer[offsetValueNxNy] * scalar, size_center); if (size > this->m_threshold) { float dx = nx - x; if (size > fabsf(dx) && size > fabsf(dy)) { float uv[2] = { (float)(COM_BLUR_BOKEH_PIXELS / 2) + (dx / size) * (float)((COM_BLUR_BOKEH_PIXELS / 2) - 1), (float)(COM_BLUR_BOKEH_PIXELS / 2) + (dy / size) * (float)((COM_BLUR_BOKEH_PIXELS / 2) - 1), }; inputBokehBuffer->read(bokeh, uv[0], uv[1]); madd_v4_v4v4(color_accum, bokeh, &inputProgramFloatBuffer[offsetColorNxNy]); add_v4_v4(multiplier_accum, bokeh); } } } offsetColorNxNy += addXStepColor; offsetValueNxNy += addXStepValue; } } } output[0] = color_accum[0] / multiplier_accum[0]; output[1] = color_accum[1] / multiplier_accum[1]; output[2] = color_accum[2] / multiplier_accum[2]; output[3] = color_accum[3] / multiplier_accum[3]; /* blend in out values over the threshold, otherwise we get sharp, ugly transitions */ if ((size_center > this->m_threshold) && (size_center < this->m_threshold * 2.0f)) { /* factor from 0-1 */ float fac = (size_center - this->m_threshold) / this->m_threshold; interp_v4_v4v4(output, readColor, output, fac); } } } void VariableSizeBokehBlurOperation::executeOpenCL(OpenCLDevice *device, MemoryBuffer *outputMemoryBuffer, cl_mem clOutputBuffer, MemoryBuffer **inputMemoryBuffers, std::list *clMemToCleanUp, std::list * /*clKernelsToCleanUp*/) { cl_kernel defocusKernel = device->COM_clCreateKernel("defocusKernel", nullptr); cl_int step = this->getStep(); cl_int maxBlur; cl_float threshold = this->m_threshold; MemoryBuffer *sizeMemoryBuffer = this->m_inputSizeProgram->getInputMemoryBuffer( inputMemoryBuffers); const float max_dim = MAX2(getWidth(), getHeight()); cl_float scalar = this->m_do_size_scale ? (max_dim / 100.0f) : 1.0f; maxBlur = (cl_int)min_ff(sizeMemoryBuffer->get_max_value() * scalar, (float)this->m_maxBlur); device->COM_clAttachMemoryBufferToKernelParameter( defocusKernel, 0, -1, clMemToCleanUp, inputMemoryBuffers, this->m_inputProgram); device->COM_clAttachMemoryBufferToKernelParameter( defocusKernel, 1, -1, clMemToCleanUp, inputMemoryBuffers, this->m_inputBokehProgram); device->COM_clAttachMemoryBufferToKernelParameter( defocusKernel, 2, 4, clMemToCleanUp, inputMemoryBuffers, this->m_inputSizeProgram); device->COM_clAttachOutputMemoryBufferToKernelParameter(defocusKernel, 3, clOutputBuffer); device->COM_clAttachMemoryBufferOffsetToKernelParameter(defocusKernel, 5, outputMemoryBuffer); clSetKernelArg(defocusKernel, 6, sizeof(cl_int), &step); clSetKernelArg(defocusKernel, 7, sizeof(cl_int), &maxBlur); clSetKernelArg(defocusKernel, 8, sizeof(cl_float), &threshold); clSetKernelArg(defocusKernel, 9, sizeof(cl_float), &scalar); device->COM_clAttachSizeToKernelParameter(defocusKernel, 10, this); device->COM_clEnqueueRange(defocusKernel, outputMemoryBuffer, 11, this); } void VariableSizeBokehBlurOperation::deinitExecution() { this->m_inputProgram = nullptr; this->m_inputBokehProgram = nullptr; this->m_inputSizeProgram = nullptr; #ifdef COM_DEFOCUS_SEARCH this->m_inputSearchProgram = nullptr; #endif } bool VariableSizeBokehBlurOperation::determineDependingAreaOfInterest( rcti *input, ReadBufferOperation *readOperation, rcti *output) { rcti newInput; rcti bokehInput; const float max_dim = MAX2(getWidth(), getHeight()); const float scalar = this->m_do_size_scale ? (max_dim / 100.0f) : 1.0f; int maxBlurScalar = this->m_maxBlur * scalar; newInput.xmax = input->xmax + maxBlurScalar + 2; newInput.xmin = input->xmin - maxBlurScalar + 2; newInput.ymax = input->ymax + maxBlurScalar - 2; newInput.ymin = input->ymin - maxBlurScalar - 2; bokehInput.xmax = COM_BLUR_BOKEH_PIXELS; bokehInput.xmin = 0; bokehInput.ymax = COM_BLUR_BOKEH_PIXELS; bokehInput.ymin = 0; NodeOperation *operation = getInputOperation(2); if (operation->determineDependingAreaOfInterest(&newInput, readOperation, output)) { return true; } operation = getInputOperation(1); if (operation->determineDependingAreaOfInterest(&bokehInput, readOperation, output)) { return true; } #ifdef COM_DEFOCUS_SEARCH rcti searchInput; searchInput.xmax = (input->xmax / InverseSearchRadiusOperation::DIVIDER) + 1; searchInput.xmin = (input->xmin / InverseSearchRadiusOperation::DIVIDER) - 1; searchInput.ymax = (input->ymax / InverseSearchRadiusOperation::DIVIDER) + 1; searchInput.ymin = (input->ymin / InverseSearchRadiusOperation::DIVIDER) - 1; operation = getInputOperation(3); if (operation->determineDependingAreaOfInterest(&searchInput, readOperation, output)) { return true; } #endif operation = getInputOperation(0); if (operation->determineDependingAreaOfInterest(&newInput, readOperation, output)) { return true; } return false; } void VariableSizeBokehBlurOperation::get_area_of_interest(const int input_idx, const rcti &output_area, rcti &r_input_area) { switch (input_idx) { case IMAGE_INPUT_INDEX: case SIZE_INPUT_INDEX: { const float max_dim = MAX2(getWidth(), getHeight()); const float scalar = m_do_size_scale ? (max_dim / 100.0f) : 1.0f; const int max_blur_scalar = m_maxBlur * scalar; r_input_area.xmax = output_area.xmax + max_blur_scalar + 2; r_input_area.xmin = output_area.xmin - max_blur_scalar - 2; r_input_area.ymax = output_area.ymax + max_blur_scalar + 2; r_input_area.ymin = output_area.ymin - max_blur_scalar - 2; break; } case BOKEH_INPUT_INDEX: { r_input_area = output_area; r_input_area.xmax = r_input_area.xmin + COM_BLUR_BOKEH_PIXELS; r_input_area.ymax = r_input_area.ymin + COM_BLUR_BOKEH_PIXELS; break; } #ifdef COM_DEFOCUS_SEARCH case DEFOCUS_INPUT_INDEX: { r_input_area.xmax = (output_area.xmax / InverseSearchRadiusOperation::DIVIDER) + 1; r_input_area.xmin = (output_area.xmin / InverseSearchRadiusOperation::DIVIDER) - 1; r_input_area.ymax = (output_area.ymax / InverseSearchRadiusOperation::DIVIDER) + 1; r_input_area.ymin = (output_area.ymin / InverseSearchRadiusOperation::DIVIDER) - 1; break; } #endif } } struct PixelData { float multiplier_accum[4]; float color_accum[4]; float threshold; float scalar; float size_center; int max_blur_scalar; int step; MemoryBuffer *bokeh_input; MemoryBuffer *size_input; MemoryBuffer *image_input; int image_width; int image_height; }; static void blur_pixel(int x, int y, PixelData &p) { BLI_assert(p.bokeh_input->getWidth() == COM_BLUR_BOKEH_PIXELS); BLI_assert(p.bokeh_input->getHeight() == COM_BLUR_BOKEH_PIXELS); #ifdef COM_DEFOCUS_SEARCH float search[4]; inputs[DEFOCUS_INPUT_INDEX]->read_elem_checked(x / InverseSearchRadiusOperation::DIVIDER, y / InverseSearchRadiusOperation::DIVIDER, search); const int minx = search[0]; const int miny = search[1]; const int maxx = search[2]; const int maxy = search[3]; #else const int minx = MAX2(x - p.max_blur_scalar, 0); const int miny = MAX2(y - p.max_blur_scalar, 0); const int maxx = MIN2(x + p.max_blur_scalar, p.image_width); const int maxy = MIN2(y + p.max_blur_scalar, p.image_height); #endif const int color_row_stride = p.image_input->row_stride * p.step; const int color_elem_stride = p.image_input->elem_stride * p.step; const int size_row_stride = p.size_input->row_stride * p.step; const int size_elem_stride = p.size_input->elem_stride * p.step; const float *row_color = p.image_input->get_elem(minx, miny); const float *row_size = p.size_input->get_elem(minx, miny); for (int ny = miny; ny < maxy; ny += p.step, row_size += size_row_stride, row_color += color_row_stride) { const float dy = ny - y; const float *size_elem = row_size; const float *color = row_color; for (int nx = minx; nx < maxx; nx += p.step, size_elem += size_elem_stride, color += color_elem_stride) { if (nx == x && ny == y) { continue; } const float size = MIN2(size_elem[0] * p.scalar, p.size_center); if (size <= p.threshold) { continue; } const float dx = nx - x; if (size <= fabsf(dx) || size <= fabsf(dy)) { continue; } /* XXX: There is no way to ensure bokeh input is an actual bokeh with #COM_BLUR_BOKEH_PIXELS * size, anything may be connected. Use the real input size and remove asserts? */ const float u = (float)(COM_BLUR_BOKEH_PIXELS / 2) + (dx / size) * (float)((COM_BLUR_BOKEH_PIXELS / 2) - 1); const float v = (float)(COM_BLUR_BOKEH_PIXELS / 2) + (dy / size) * (float)((COM_BLUR_BOKEH_PIXELS / 2) - 1); float bokeh[4]; p.bokeh_input->read_elem_checked(u, v, bokeh); madd_v4_v4v4(p.color_accum, bokeh, color); add_v4_v4(p.multiplier_accum, bokeh); } } } void VariableSizeBokehBlurOperation::update_memory_buffer_partial(MemoryBuffer *output, const rcti &area, Span inputs) { PixelData p; p.bokeh_input = inputs[BOKEH_INPUT_INDEX]; p.size_input = inputs[SIZE_INPUT_INDEX]; p.image_input = inputs[IMAGE_INPUT_INDEX]; p.step = QualityStepHelper::getStep(); p.threshold = m_threshold; p.image_width = this->getWidth(); p.image_height = this->getHeight(); rcti scalar_area; this->get_area_of_interest(SIZE_INPUT_INDEX, area, scalar_area); BLI_rcti_isect(&scalar_area, &p.size_input->get_rect(), &scalar_area); const float max_size = p.size_input->get_max_value(scalar_area); const float max_dim = MAX2(this->getWidth(), this->getHeight()); p.scalar = m_do_size_scale ? (max_dim / 100.0f) : 1.0f; p.max_blur_scalar = static_cast(max_size * p.scalar); CLAMP(p.max_blur_scalar, 1, m_maxBlur); for (BuffersIterator it = output->iterate_with({p.image_input, p.size_input}, area); !it.is_end(); ++it) { const float *color = it.in(0); const float size = *it.in(1); copy_v4_v4(p.color_accum, color); copy_v4_fl(p.multiplier_accum, 1.0f); p.size_center = size * p.scalar; if (p.size_center > p.threshold) { blur_pixel(it.x, it.y, p); } it.out[0] = p.color_accum[0] / p.multiplier_accum[0]; it.out[1] = p.color_accum[1] / p.multiplier_accum[1]; it.out[2] = p.color_accum[2] / p.multiplier_accum[2]; it.out[3] = p.color_accum[3] / p.multiplier_accum[3]; /* Blend in out values over the threshold, otherwise we get sharp, ugly transitions. */ if ((p.size_center > p.threshold) && (p.size_center < p.threshold * 2.0f)) { /* Factor from 0-1. */ const float fac = (p.size_center - p.threshold) / p.threshold; interp_v4_v4v4(it.out, color, it.out, fac); } } } #ifdef COM_DEFOCUS_SEARCH /* #InverseSearchRadiusOperation. */ InverseSearchRadiusOperation::InverseSearchRadiusOperation() { this->addInputSocket(DataType::Value, ResizeMode::None); /* Radius. */ this->addOutputSocket(DataType::Color); this->flags.complex = true; this->m_inputRadius = nullptr; } void InverseSearchRadiusOperation::initExecution() { this->m_inputRadius = this->getInputSocketReader(0); } void *InverseSearchRadiusOperation::initializeTileData(rcti *rect) { MemoryBuffer *data = new MemoryBuffer(DataType::Color, rect); float *buffer = data->getBuffer(); int x, y; int width = this->m_inputRadius->getWidth(); int height = this->m_inputRadius->getHeight(); float temp[4]; int offset = 0; for (y = rect->ymin; y < rect->ymax; y++) { for (x = rect->xmin; x < rect->xmax; x++) { int rx = x * DIVIDER; int ry = y * DIVIDER; buffer[offset] = MAX2(rx - m_maxBlur, 0); buffer[offset + 1] = MAX2(ry - m_maxBlur, 0); buffer[offset + 2] = MIN2(rx + DIVIDER + m_maxBlur, width); buffer[offset + 3] = MIN2(ry + DIVIDER + m_maxBlur, height); offset += 4; } } # if 0 for (x = rect->xmin; x < rect->xmax; x++) { for (y = rect->ymin; y < rect->ymax; y++) { int rx = x * DIVIDER; int ry = y * DIVIDER; float radius = 0.0f; float maxx = x; float maxy = y; for (int x2 = 0; x2 < DIVIDER; x2++) { for (int y2 = 0; y2 < DIVIDER; y2++) { this->m_inputRadius->read(temp, rx + x2, ry + y2, PixelSampler::Nearest); if (radius < temp[0]) { radius = temp[0]; maxx = x2; maxy = y2; } } } int impactRadius = ceil(radius / DIVIDER); for (int x2 = x - impactRadius; x2 < x + impactRadius; x2++) { for (int y2 = y - impactRadius; y2 < y + impactRadius; y2++) { data->read(temp, x2, y2); temp[0] = MIN2(temp[0], maxx); temp[1] = MIN2(temp[1], maxy); temp[2] = MAX2(temp[2], maxx); temp[3] = MAX2(temp[3], maxy); data->writePixel(x2, y2, temp); } } } } # endif return data; } void InverseSearchRadiusOperation::executePixelChunk(float output[4], int x, int y, void *data) { MemoryBuffer *buffer = (MemoryBuffer *)data; buffer->readNoCheck(output, x, y); } void InverseSearchRadiusOperation::deinitializeTileData(rcti *rect, void *data) { if (data) { MemoryBuffer *mb = (MemoryBuffer *)data; delete mb; } } void InverseSearchRadiusOperation::deinitExecution() { this->m_inputRadius = nullptr; } void InverseSearchRadiusOperation::determineResolution(unsigned int resolution[2], unsigned int preferredResolution[2]) { NodeOperation::determineResolution(resolution, preferredResolution); resolution[0] = resolution[0] / DIVIDER; resolution[1] = resolution[1] / DIVIDER; } bool InverseSearchRadiusOperation::determineDependingAreaOfInterest( rcti *input, ReadBufferOperation *readOperation, rcti *output) { rcti newRect; newRect.ymin = input->ymin * DIVIDER - m_maxBlur; newRect.ymax = input->ymax * DIVIDER + m_maxBlur; newRect.xmin = input->xmin * DIVIDER - m_maxBlur; newRect.xmax = input->xmax * DIVIDER + m_maxBlur; return NodeOperation::determineDependingAreaOfInterest(&newRect, readOperation, output); } #endif } // namespace blender::compositor