# examples/compute_noop.py

"""
Example compute shader that does ... nothing but copy a value from one
buffer into another.
"""

import ctypes

import wgpu
import wgpu.backend.rs  # Select backend
from wgpu.utils import compute_with_buffers  # Convenience function
from python_shader import python2shader, i32, Array


# %% Shader and data


# Compute shader written as a Python function and processed by the
# python2shader decorator. The decorated object is what this script passes as
# the shader to compute_with_buffers() and device.createShaderModule().
# Only comments are used here (no docstring) so the function body that the
# decorator sees stays exactly as written.
@python2shader
def compute_shader(input, buffer):
    # Declare an i32 input called "index", tied to "GlobalInvocationId"
    # (presumably the id of the current shader invocation -- TODO confirm
    # against the python_shader docs).
    input.define("index", "GlobalInvocationId", i32)
    # Declare two i32 array buffers: data1 at binding 0, data2 at binding 1.
    buffer.define("data1", 0, Array(i32))
    buffer.define("data2", 1, Array(i32))

    # The "no-op": copy the element at this index from data1 into data2.
    buffer.data2[input.index] = buffer.data1[input.index]


# Input data: a ctypes array holding the 32-bit integers 0 .. n-1
n = 20
IntArrayType = ctypes.c_int32 * n
data = IntArrayType()  # zero-initialised
data[:] = range(n)


# %% The short version, using ctypes arrays

# Both dicts are keyed by binding index:
# the first maps each input binding to its data,
# the second maps each output binding to the type of the output.
inputs = {0: data}
output_types = {1: IntArrayType}
out = compute_with_buffers(inputs, output_types, compute_shader, n=n)

# The result is a dict with the same keys as the output types;
# pick the buffer at binding 1 and print its contents
result = out[1]
print(result[:])


# %% The short version, using numpy

# import numpy as np
#
# numpy_data = np.arange(n, dtype=np.int32)
#
# data = IntArrayType.from_address(numpy_data.ctypes.data)
# out = compute_with_buffers({0: data}, {1: IntArrayType}, compute_shader, n=n)
# print(np.frombuffer(out[1], dtype=np.int32))


# %% The long version using the wgpu API

# Acquire an adapter and device, and wrap the shader in a shader module
adapter = wgpu.requestAdapter(powerPreference="high-performance")
device = adapter.requestDevice(extensions=[], limits=wgpu.GPULimits())
cshader = device.createShaderModule(code=compute_shader)

# Both buffers get the byte size of the input array and the same usage flags.
# The input buffer (buffer1) is created in mapped state so that it can be
# filled from Python; the output buffer (buffer2) is created unmapped.
# NOTE(review): buffer1 is only written from the host in this script, so the
# MAP_READ flag looks unnecessary for it -- confirm against the wgpu version.
buffer_nbytes = ctypes.sizeof(data)
buffer_usage = wgpu.BufferUsage.STORAGE | wgpu.BufferUsage.MAP_READ
buffer1 = device.createBufferMapped(size=buffer_nbytes, usage=buffer_usage)
buffer2 = device.createBuffer(size=buffer_nbytes, usage=buffer_usage)

# View the mapped memory of buffer1 as a ctypes int32 array
array1 = IntArrayType.from_buffer(buffer1.mapping)
# With Numpy this would be:
# array1 = np.frombuffer(buffer1.mapping, np.int32)

# Write the input values into the mapped memory, then unmap the buffer
array1[:] = data
buffer1.unmap()

# Layout: bindings 0 and 1 are both storage buffers visible to the compute stage
binding_layouts = [
    {
        "binding": slot,
        "visibility": wgpu.ShaderStage.COMPUTE,
        "type": wgpu.BindingType.storage_buffer,
    }
    for slot in (0, 1)
]

# Bindings: buffer1 goes to binding 0 and buffer2 to binding 1, each bound
# over its full size starting at offset 0
bindings = [
    {"binding": slot, "resource": {"buffer": buf, "offset": 0, "size": buf.size}}
    for slot, buf in enumerate((buffer1, buffer2))
]

# Turn the descriptions into the layout objects and the bind group
bind_group_layout = device.createBindGroupLayout(bindings=binding_layouts)
pipeline_layout = device.createPipelineLayout(bindGroupLayouts=[bind_group_layout])
bind_group = device.createBindGroup(layout=bind_group_layout, bindings=bindings)

# Build the compute pipeline from the shader module, using entry point "main"
compute_stage = {"module": cshader, "entryPoint": "main"}
compute_pipeline = device.createComputePipeline(
    layout=pipeline_layout, computeStage=compute_stage
)

# Record one compute pass that dispatches n x 1 x 1, then submit it
command_encoder = device.createCommandEncoder()
compute_pass = command_encoder.beginComputePass()
compute_pass.setPipeline(compute_pipeline)
compute_pass.setBindGroup(0, bind_group, [], 0, 999999)  # last 2 elements not used
compute_pass.dispatch(n, 1, 1)  # x y z
compute_pass.endPass()
queue = device.defaultQueue
queue.submit([command_encoder.finish()])

# Map the output buffer for reading, view it as an int32 array and print it
mapped = buffer2.mapRead()
result = IntArrayType.from_buffer(mapped)  # cast
print(result[:])

# With Numpy this would be:
# print(np.frombuffer(buffer2.mapRead(), np.int32))