adding compute pass

This commit is contained in:
2025-09-10 17:46:53 +02:00
parent 287f18402e
commit ff24a19480
17 changed files with 426 additions and 82 deletions

View File

@@ -33,7 +33,14 @@ const char* hlsl_source = HLSL_SOURCE(
int main(void)
{
PulseBackend backend = PulseLoadBackend(PULSE_BACKEND_D3D11, PULSE_SHADER_FORMAT_HLSL_BIT, PULSE_HIGH_DEBUG);
PulseFlags shader_format;
#ifdef PULSE_D3D11_COMPILER_UNAVAILABLE
shader_format = PULSE_SHADER_FORMAT_DXBC_BIT;
#else
shader_format = PULSE_SHADER_FORMAT_HLSL_BIT;
#endif
PulseBackend backend = PulseLoadBackend(PULSE_BACKEND_D3D11, shader_format, PULSE_HIGH_DEBUG);
PulseSetDebugCallback(backend, DebugCallBack);
PulseDevice device = PulseCreateDevice(backend, NULL, 0);
@@ -45,16 +52,30 @@ int main(void)
// GPU computations
{
PulseComputePipelineCreateInfo info = { 0 };
info.code_size = strlen(hlsl_source);
info.code = (const uint8_t*)hlsl_source;
#ifdef PULSE_D3D11_COMPILER_UNAVAILABLE
const uint8_t shader_bytecode[] = {
#include "shader.cso.h"
};
info.code_size = sizeof(shader_bytecode);
info.code = shader_bytecode;
#else
info.code_size = strlen(hlsl_source);
info.code = (const uint8_t*)hlsl_source;
#endif
info.entrypoint = "CSMain";
info.format = PULSE_SHADER_FORMAT_HLSL_BIT;
info.format = shader_format;
info.num_readwrite_storage_buffers = 1;
PulseComputePipeline pipeline = PulseCreateComputePipeline(device, &info);
PulseFence fence = PulseCreateFence(device);
PulseCommandList cmd = PulseRequestCommandList(device, PULSE_COMMAND_LIST_GENERAL);
PulseComputePass pass = PulseBeginComputePass(cmd);
PulseBindStorageBuffers(pass, &buffer, 1);
PulseBindComputePipeline(pass, pipeline);
PulseDispatchComputations(pass, 16, 1, 1);
PulseEndComputePass(pass);
PulseSubmitCommandList(device, cmd, fence);
PulseWaitForFences(device, &fence, 1, true);
@@ -63,6 +84,42 @@ int main(void)
PulseDestroyComputePipeline(device, pipeline);
}
// Get result and read it on CPU
{
PulseBufferCreateInfo staging_buffer_create_info = { 0 };
staging_buffer_create_info.size = BUFFER_SIZE;
staging_buffer_create_info.usage = PULSE_BUFFER_USAGE_TRANSFER_UPLOAD | PULSE_BUFFER_USAGE_TRANSFER_DOWNLOAD;
PulseBuffer staging_buffer = PulseCreateBuffer(device, &staging_buffer_create_info);
PulseFence fence = PulseCreateFence(device);
PulseCommandList cmd = PulseRequestCommandList(device, PULSE_COMMAND_LIST_TRANSFER_ONLY);
PulseBufferRegion src_region = { 0 };
src_region.buffer = buffer;
src_region.size = BUFFER_SIZE;
PulseBufferRegion dst_region = { 0 };
dst_region.buffer = staging_buffer;
dst_region.size = BUFFER_SIZE;
PulseCopyBufferToBuffer(cmd, &src_region, &dst_region);
PulseSubmitCommandList(device, cmd, fence);
PulseWaitForFences(device, &fence, 1, true);
void* ptr;
PulseMapBuffer(staging_buffer, PULSE_MAP_READ, &ptr);
for(uint32_t i = 0; i < BUFFER_SIZE / sizeof(uint32_t); i++)
printf("%d, ", ((int32_t*)ptr)[i]);
puts("");
PulseUnmapBuffer(staging_buffer);
PulseDestroyBuffer(device, staging_buffer);
PulseReleaseCommandList(device, cmd);
PulseDestroyFence(device, fence);
}
PulseDestroyBuffer(device, buffer);
PulseDestroyDevice(device);