One drawback to trying to predict the number of threads that will be used in the `task_graph` is that we are only sure of the number when the threads are running. Using `BLI_task_parallel_range` allows the driver to choose the best thread distribution through `parallel_reduce`. The benefit is most evident on hardware with fewer cores. This is the result on an 4-core laptop: ||before:|after: |---|---|---| |large_mesh_editing:|Average: 5.203638 FPS|Average: 5.398925 FPS ||rdata 15ms iter 43ms (frame 193ms)|rdata 14ms iter 36ms (frame 187ms) Differential Revision: https://developer.blender.org/D11558
48 lines
1.6 KiB
C++
48 lines
1.6 KiB
C++
/* Apache License, Version 2.0 */
|
|
|
|
#include "testing/testing.h"
|
|
|
|
#include "MEM_guardedalloc.h"
|
|
|
|
#include "GPU_index_buffer.h"
|
|
|
|
#include "gpu_testing.hh"
|
|
|
|
namespace blender::gpu::tests {
|
|
|
|
TEST_F(GPUTest, gpu_index_buffer_subbuilders)
|
|
{
|
|
const uint num_subbuilders = 10;
|
|
const uint verts_per_subbuilders = 100;
|
|
const uint vertex_len = num_subbuilders * verts_per_subbuilders;
|
|
|
|
GPUIndexBufBuilder builder;
|
|
GPU_indexbuf_init(&builder, GPU_PRIM_POINTS, vertex_len, vertex_len);
|
|
|
|
GPUIndexBufBuilder subbuilders[num_subbuilders];
|
|
for (int subbuilder_index = 0; subbuilder_index < num_subbuilders; subbuilder_index++) {
|
|
memcpy(&subbuilders[subbuilder_index], &builder, sizeof(builder));
|
|
}
|
|
|
|
for (int subbuilder_index = 0; subbuilder_index < num_subbuilders; subbuilder_index++) {
|
|
GPUIndexBufBuilder &subbuilder = subbuilders[subbuilder_index];
|
|
for (int subbuilder_vert_index = 0; subbuilder_vert_index < verts_per_subbuilders;
|
|
subbuilder_vert_index++) {
|
|
int vert_index_to_update = subbuilder_index * verts_per_subbuilders + subbuilder_vert_index;
|
|
GPU_indexbuf_set_point_vert(&subbuilder, vert_index_to_update, vert_index_to_update);
|
|
}
|
|
}
|
|
|
|
for (int subbuilder_index = 0; subbuilder_index < num_subbuilders; subbuilder_index++) {
|
|
EXPECT_EQ(builder.index_len, subbuilder_index * verts_per_subbuilders);
|
|
GPU_indexbuf_join(&builder, &subbuilders[subbuilder_index]);
|
|
EXPECT_EQ(builder.index_len, (subbuilder_index + 1) * verts_per_subbuilders);
|
|
}
|
|
|
|
GPUIndexBuf *index_buffer = GPU_indexbuf_build(&builder);
|
|
EXPECT_NE(index_buffer, nullptr);
|
|
GPU_INDEXBUF_DISCARD_SAFE(index_buffer);
|
|
}
|
|
|
|
} // namespace blender::gpu::tests
|