294 lines
8.4 KiB
C++
294 lines
8.4 KiB
C++
/*
|
|
* Copyright 2011, Blender Foundation.
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version 2
|
|
* of the License, or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
*
|
|
* Contributor:
|
|
* Jeroen Bakker
|
|
* Monique Dewanchand
|
|
*/
|
|
|
|
#include <list>
|
|
#include <stdio.h>
|
|
|
|
#include "BKE_global.h"
|
|
|
|
#include "COM_WorkScheduler.h"
|
|
#include "COM_CPUDevice.h"
|
|
#include "COM_OpenCLDevice.h"
|
|
#include "COM_OpenCLKernels.cl.h"
|
|
#include "OCL_opencl.h"
|
|
|
|
#include "PIL_time.h"
|
|
#include "BLI_threads.h"
|
|
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_NOTHREAD
|
|
#warning COM_CURRENT_THREADING_MODEL COM_TM_NOTHREAD is activated. Use only for debugging.
|
|
#elif COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
#else
|
|
#error COM_CURRENT_THREADING_MODEL No threading model selected
|
|
#endif
|
|
|
|
|
|
/// @brief list of all CPUDevices. for every hardware thread an instance of CPUDevice is created
|
|
static vector<CPUDevice *> cpudevices;
|
|
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
/// @brief list of all thread for every CPUDevice in cpudevices a thread exists
|
|
static ListBase cputhreads;
|
|
/// @brief all scheduled work for the cpu
|
|
static ThreadQueue *cpuqueue;
|
|
static ThreadQueue *gpuqueue;
|
|
#ifdef COM_OPENCL_ENABLED
|
|
static cl_context context;
|
|
static cl_program program;
|
|
/// @brief list of all OpenCLDevices. for every OpenCL GPU device an instance of OpenCLDevice is created
|
|
static vector<OpenCLDevice *> gpudevices;
|
|
/// @brief list of all thread for every GPUDevice in cpudevices a thread exists
|
|
static ListBase gputhreads;
|
|
/// @brief all scheduled work for the gpu
|
|
#ifdef COM_OPENCL_ENABLED
|
|
static bool openclActive = false;
|
|
#endif
|
|
#endif
|
|
#endif
|
|
|
|
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
void *WorkScheduler::thread_execute_cpu(void *data)
|
|
{
|
|
Device *device = (Device *)data;
|
|
WorkPackage *work;
|
|
|
|
while ((work = (WorkPackage *)BLI_thread_queue_pop(cpuqueue))) {
|
|
device->execute(work);
|
|
delete work;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
void *WorkScheduler::thread_execute_gpu(void *data)
|
|
{
|
|
Device *device = (Device *)data;
|
|
WorkPackage *work;
|
|
|
|
while ((work = (WorkPackage *)BLI_thread_queue_pop(gpuqueue))) {
|
|
device->execute(work);
|
|
delete work;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
#endif
|
|
|
|
|
|
|
|
void WorkScheduler::schedule(ExecutionGroup *group, int chunkNumber)
|
|
{
|
|
WorkPackage *package = new WorkPackage(group, chunkNumber);
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_NOTHREAD
|
|
CPUDevice device;
|
|
device.execute(package);
|
|
delete package;
|
|
#elif COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
#ifdef COM_OPENCL_ENABLED
|
|
if (group->isOpenCL() && openclActive) {
|
|
BLI_thread_queue_push(gpuqueue, package);
|
|
}
|
|
else {
|
|
BLI_thread_queue_push(cpuqueue, package);
|
|
}
|
|
#else
|
|
BLI_thread_queue_push(cpuqueue, package);
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
void WorkScheduler::start(CompositorContext &context)
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
unsigned int index;
|
|
cpuqueue = BLI_thread_queue_init();
|
|
BLI_init_threads(&cputhreads, thread_execute_cpu, cpudevices.size());
|
|
for (index = 0; index < cpudevices.size(); index++) {
|
|
Device *device = cpudevices[index];
|
|
BLI_insert_thread(&cputhreads, device);
|
|
}
|
|
#ifdef COM_OPENCL_ENABLED
|
|
if (context.getHasActiveOpenCLDevices()) {
|
|
gpuqueue = BLI_thread_queue_init();
|
|
BLI_init_threads(&gputhreads, thread_execute_gpu, gpudevices.size());
|
|
for (index = 0; index < gpudevices.size(); index++) {
|
|
Device *device = gpudevices[index];
|
|
BLI_insert_thread(&gputhreads, device);
|
|
}
|
|
openclActive = true;
|
|
}
|
|
else {
|
|
openclActive = false;
|
|
}
|
|
#endif
|
|
#endif
|
|
}
|
|
void WorkScheduler::finish()
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
#ifdef COM_OPENCL_ENABLED
|
|
if (openclActive) {
|
|
BLI_thread_queue_wait_finish(gpuqueue);
|
|
BLI_thread_queue_wait_finish(cpuqueue);
|
|
}
|
|
else {
|
|
BLI_thread_queue_wait_finish(cpuqueue);
|
|
}
|
|
#else
|
|
BLI_thread_queue_wait_finish(cpuqueue);
|
|
#endif
|
|
#endif
|
|
}
|
|
void WorkScheduler::stop()
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
BLI_thread_queue_nowait(cpuqueue);
|
|
BLI_end_threads(&cputhreads);
|
|
BLI_thread_queue_free(cpuqueue);
|
|
cpuqueue = NULL;
|
|
#ifdef COM_OPENCL_ENABLED
|
|
if (openclActive) {
|
|
BLI_thread_queue_nowait(gpuqueue);
|
|
BLI_end_threads(&gputhreads);
|
|
BLI_thread_queue_free(gpuqueue);
|
|
gpuqueue = NULL;
|
|
}
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
bool WorkScheduler::hasGPUDevices()
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
#ifdef COM_OPENCL_ENABLED
|
|
return gpudevices.size() > 0;
|
|
#else
|
|
return 0;
|
|
#endif
|
|
#else
|
|
return 0;
|
|
#endif
|
|
}
|
|
|
|
extern void clContextError(const char *errinfo, const void *private_info, size_t cb, void *user_data)
|
|
{
|
|
printf("OPENCL error: %s\n", errinfo);
|
|
}
|
|
|
|
void WorkScheduler::initialize()
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
int numberOfCPUThreads = BLI_system_thread_count();
|
|
|
|
for (int index = 0; index < numberOfCPUThreads; index++) {
|
|
CPUDevice *device = new CPUDevice();
|
|
device->initialize();
|
|
cpudevices.push_back(device);
|
|
}
|
|
#ifdef COM_OPENCL_ENABLED
|
|
context = NULL;
|
|
program = NULL;
|
|
if (clCreateContextFromType) {
|
|
cl_uint numberOfPlatforms = 0;
|
|
cl_int error;
|
|
error = clGetPlatformIDs(0, 0, &numberOfPlatforms);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
if (G.f & G_DEBUG) printf("%d number of platforms\n", numberOfPlatforms);
|
|
cl_platform_id *platforms = new cl_platform_id[numberOfPlatforms];
|
|
error = clGetPlatformIDs(numberOfPlatforms, platforms, 0);
|
|
unsigned int indexPlatform;
|
|
for (indexPlatform = 0; indexPlatform < numberOfPlatforms; indexPlatform++) {
|
|
cl_platform_id platform = platforms[indexPlatform];
|
|
cl_uint numberOfDevices = 0;
|
|
clGetDeviceIDs(platform, CL_DEVICE_TYPE_GPU, 0, 0, &numberOfDevices);
|
|
if (numberOfDevices>0) {
|
|
cl_device_id *cldevices = new cl_device_id[numberOfDevices];
|
|
clGetDeviceIDs(platform, CL_DEVICE_TYPE_GPU, numberOfDevices, cldevices, 0);
|
|
|
|
context = clCreateContext(NULL, numberOfDevices, cldevices, clContextError, NULL, &error);
|
|
if (error != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
program = clCreateProgramWithSource(context, 1, &clkernelstoh_COM_OpenCLKernels_cl, 0, &error);
|
|
error = clBuildProgram(program, numberOfDevices, cldevices, 0, 0, 0);
|
|
if (error != CL_SUCCESS) {
|
|
cl_int error2;
|
|
size_t ret_val_size = 0;
|
|
printf("CLERROR[%d]: %s\n", error, clewErrorString(error));
|
|
error2 = clGetProgramBuildInfo(program, cldevices[0], CL_PROGRAM_BUILD_LOG, 0, NULL, &ret_val_size);
|
|
if (error2 != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
char *build_log = new char[ret_val_size + 1];
|
|
error2 = clGetProgramBuildInfo(program, cldevices[0], CL_PROGRAM_BUILD_LOG, ret_val_size, build_log, NULL);
|
|
if (error2 != CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
build_log[ret_val_size] = '\0';
|
|
printf("%s", build_log);
|
|
delete build_log;
|
|
}
|
|
else {
|
|
unsigned int indexDevices;
|
|
for (indexDevices = 0; indexDevices < numberOfDevices; indexDevices++) {
|
|
cl_device_id device = cldevices[indexDevices];
|
|
cl_int vendorID = 0;
|
|
cl_int error = clGetDeviceInfo(device, CL_DEVICE_VENDOR_ID, sizeof(cl_int), &vendorID, NULL);
|
|
if (error!= CL_SUCCESS) { printf("CLERROR[%d]: %s\n", error, clewErrorString(error)); }
|
|
OpenCLDevice *clDevice = new OpenCLDevice(context, device, program, vendorID);
|
|
clDevice->initialize();
|
|
gpudevices.push_back(clDevice);
|
|
}
|
|
}
|
|
delete[] cldevices;
|
|
}
|
|
}
|
|
delete[] platforms;
|
|
}
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
void WorkScheduler::deinitialize()
|
|
{
|
|
#if COM_CURRENT_THREADING_MODEL == COM_TM_QUEUE
|
|
Device *device;
|
|
while (cpudevices.size() > 0) {
|
|
device = cpudevices.back();
|
|
cpudevices.pop_back();
|
|
device->deinitialize();
|
|
delete device;
|
|
}
|
|
#ifdef COM_OPENCL_ENABLED
|
|
while (gpudevices.size() > 0) {
|
|
device = gpudevices.back();
|
|
gpudevices.pop_back();
|
|
device->deinitialize();
|
|
delete device;
|
|
}
|
|
if (program) {
|
|
clReleaseProgram(program);
|
|
program = NULL;
|
|
}
|
|
if (context) {
|
|
clReleaseContext(context);
|
|
context = NULL;
|
|
}
|
|
#endif
|
|
#endif
|
|
}
|