- should increase speed with large node setups - enables caching of buffers in the node editor (in the future) - OpenCL part still needs some work
172 lines
5.6 KiB
C++
172 lines
5.6 KiB
C++
/*
|
|
* Copyright 2011, Blender Foundation.
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version 2
|
|
* of the License, or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
*
|
|
* Contributor:
|
|
* Jeroen Bakker
|
|
* Monique Dewanchand
|
|
*/
|
|
|
|
#include "COM_WriteBufferOperation.h"
|
|
#include "COM_defines.h"
|
|
#include <stdio.h>
|
|
|
|
WriteBufferOperation::WriteBufferOperation() :NodeOperation()
|
|
{
|
|
this->addInputSocket(COM_DT_COLOR);
|
|
this->memoryProxy = new MemoryProxy();
|
|
this->memoryProxy->setWriteBufferOperation(this);
|
|
this->memoryProxy->setExecutor(NULL);
|
|
this->tree = NULL;
|
|
}
|
|
WriteBufferOperation::~WriteBufferOperation()
|
|
{
|
|
if (this->memoryProxy) {
|
|
delete this->memoryProxy;
|
|
this->memoryProxy = NULL;
|
|
}
|
|
}
|
|
|
|
void WriteBufferOperation::executePixel(float *color, float x, float y, PixelSampler sampler, MemoryBuffer *inputBuffers[])
|
|
{
|
|
input->read(color, x, y, sampler, inputBuffers);
|
|
}
|
|
|
|
void WriteBufferOperation::initExecution()
|
|
{
|
|
this->input = this->getInputOperation(0);
|
|
this->memoryProxy->allocate(this->width, this->height);
|
|
}
|
|
|
|
void WriteBufferOperation::deinitExecution()
|
|
{
|
|
this->input = NULL;
|
|
this->memoryProxy->free();
|
|
}
|
|
|
|
void WriteBufferOperation::executeRegion(rcti *rect, unsigned int tileNumber, MemoryBuffer** memoryBuffers)
|
|
{
|
|
//MemoryBuffer *memoryBuffer = MemoryManager::getMemoryBuffer(this->getMemoryProxy(), tileNumber);
|
|
MemoryBuffer *memoryBuffer = this->memoryProxy->getBuffer();
|
|
float *buffer = memoryBuffer->getBuffer();
|
|
if (this->input->isComplex()) {
|
|
void *data = this->input->initializeTileData(rect, memoryBuffers);
|
|
int x1 = rect->xmin;
|
|
int y1 = rect->ymin;
|
|
int x2 = rect->xmax;
|
|
int y2 = rect->ymax;
|
|
int x;
|
|
int y;
|
|
bool breaked = false;
|
|
for (y = y1 ; y < y2 && (!breaked) ; y++) {
|
|
int offset4 = (y*memoryBuffer->getWidth()+x1)*COM_NUMBER_OF_CHANNELS;
|
|
for (x = x1 ; x < x2; x++) {
|
|
input->read(&(buffer[offset4]), x, y, memoryBuffers, data);
|
|
offset4 +=COM_NUMBER_OF_CHANNELS;
|
|
|
|
}
|
|
if (tree->test_break && tree->test_break(tree->tbh)) {
|
|
breaked = true;
|
|
}
|
|
|
|
}
|
|
if (data) {
|
|
this->input->deinitializeTileData(rect, memoryBuffers, data);
|
|
data = NULL;
|
|
}
|
|
}
|
|
else {
|
|
int x1 = rect->xmin;
|
|
int y1 = rect->ymin;
|
|
int x2 = rect->xmax;
|
|
int y2 = rect->ymax;
|
|
|
|
int x;
|
|
int y;
|
|
bool breaked = false;
|
|
for (y = y1 ; y < y2 && (!breaked) ; y++) {
|
|
int offset4 = (y*memoryBuffer->getWidth()+x1)*COM_NUMBER_OF_CHANNELS;
|
|
for (x = x1 ; x < x2 ; x++) {
|
|
input->read(&(buffer[offset4]), x, y, COM_PS_NEAREST, memoryBuffers);
|
|
offset4 +=COM_NUMBER_OF_CHANNELS;
|
|
}
|
|
if (tree->test_break && tree->test_break(tree->tbh)) {
|
|
breaked = true;
|
|
}
|
|
}
|
|
}
|
|
memoryBuffer->setCreatedState();
|
|
}
|
|
|
|
void WriteBufferOperation::executeOpenCLRegion(cl_context context, cl_program program, cl_command_queue queue, rcti *rect, unsigned int chunkNumber, MemoryBuffer** inputMemoryBuffers)
|
|
{
|
|
MemoryBuffer *outputMemoryBuffer = this->getMemoryProxy()->getBuffer();// @todo wrong implementation needs revision
|
|
float *outputFloatBuffer = outputMemoryBuffer->getBuffer();
|
|
cl_int error;
|
|
/*
|
|
* 1. create cl_mem from outputbuffer
|
|
* 2. call NodeOperation (input) executeOpenCLChunk(.....)
|
|
* 3. schedule readback from opencl to main device (outputbuffer)
|
|
* 4. schedule native callback
|
|
*
|
|
* note: list of cl_mem will be filled by 2, and needs to be cleaned up by 4
|
|
*/
|
|
// STEP 1
|
|
const unsigned int outputBufferWidth = outputMemoryBuffer->getWidth();
|
|
const unsigned int outputBufferHeight = outputMemoryBuffer->getHeight();
|
|
|
|
const cl_image_format imageFormat = {
|
|
CL_RGBA,
|
|
CL_FLOAT
|
|
};
|
|
|
|
cl_mem clOutputBuffer = clCreateImage2D(context, CL_MEM_WRITE_ONLY|CL_MEM_USE_HOST_PTR, &imageFormat, outputBufferWidth, outputBufferHeight, 0, outputFloatBuffer, &error);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
|
|
// STEP 2
|
|
list<cl_mem> * clMemToCleanUp = new list<cl_mem>();
|
|
clMemToCleanUp->push_back(clOutputBuffer);
|
|
list<cl_kernel> *clKernelsToCleanUp = new list<cl_kernel>();
|
|
|
|
this->input->executeOpenCL(context, program, queue, outputMemoryBuffer, clOutputBuffer, inputMemoryBuffers, clMemToCleanUp, clKernelsToCleanUp);
|
|
|
|
// STEP 3
|
|
|
|
size_t origin[3] = {0,0,0};
|
|
size_t region[3] = {outputBufferWidth,outputBufferHeight,1};
|
|
|
|
error = clEnqueueBarrier(queue);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
error = clEnqueueReadImage(queue, clOutputBuffer, CL_TRUE, origin, region, 0, 0, outputFloatBuffer, 0, NULL, NULL);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
// STEP 4
|
|
|
|
while (clMemToCleanUp->size()>0) {
|
|
cl_mem mem = clMemToCleanUp->front();
|
|
error = clReleaseMemObject(mem);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
clMemToCleanUp->pop_front();
|
|
}
|
|
|
|
while (clKernelsToCleanUp->size()>0) {
|
|
cl_kernel kernel = clKernelsToCleanUp->front();
|
|
error = clReleaseKernel(kernel);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
clKernelsToCleanUp->pop_front();
|
|
}
|
|
delete clKernelsToCleanUp;
|
|
}
|