// Copyright 2018 The Dawn Authors
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
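// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and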
// limitations under the License.
#include "tests/DawnTest.h"
#include "utils/DawnHelpers.h"
#include <array>
// Fixture for tests that copy one storage buffer into another with a compute shader.
// Each test supplies its own shader; BasicTest() does the common setup and verification.
class ComputeCopyStorageBufferTests : public DawnTest {
  public:
    // Number of workgroups dispatched along X; the shaders copy one element per invocation index.
    static constexpr int kInstances = 4;
    // Number of 32-bit words in each copied element (a uvec4, or a struct of two uvec2).
    static constexpr int kUintsPerInstance = 4;
    // Total number of 32-bit words held by each of the source and destination buffers.
    static constexpr int kNumUints = kInstances * kUintsPerInstance;

    // Runs `shader` (compute stage, entry point "main") against a source buffer at binding 0 and
    // a destination buffer at binding 1, then expects the destination to equal the source data.
    void BasicTest(const char* shader);
};
void ComputeCopyStorageBufferTests::BasicTest(const char* shader) {
auto bgl = utils::MakeBindGroupLayout(
device, {
{0, dawn::ShaderStageBit::Compute, dawn::BindingType::StorageBuffer},
{1, dawn::ShaderStageBit::Compute, dawn::BindingType::StorageBuffer},
// Set up shader and pipeline
auto module = utils::CreateShaderModule(device, dawn::ShaderStage::Compute, shader);
auto pl = utils::MakeBasicPipelineLayout(device, &bgl);
auto pipeline = device.CreateComputePipelineBuilder()
.SetStage(dawn::ShaderStage::Compute, module, "main")
// Set up src storage buffer
dawn::BufferDescriptor srcDesc;
srcDesc.size = kNumUints * sizeof(uint32_t);
srcDesc.usage = dawn::BufferUsageBit::Storage | dawn::BufferUsageBit::TransferSrc |
dawn::Buffer src = device.CreateBuffer(&srcDesc);
std::array<uint32_t, kNumUints> expected;
for (uint32_t i = 0; i < kNumUints; ++i) {
expected[i] = (i + 1u) * 0x11111111u;
src.SetSubData(0, sizeof(expected), reinterpret_cast<const uint8_t*>(;
EXPECT_BUFFER_U32_RANGE_EQ(, src, 0, kNumUints);
auto srcView =
src.CreateBufferViewBuilder().SetExtent(0, kNumUints * sizeof(uint32_t)).GetResult();
// Set up dst storage buffer
dawn::BufferDescriptor dstDesc;
dstDesc.size = kNumUints * sizeof(uint32_t);
dstDesc.usage = dawn::BufferUsageBit::Storage | dawn::BufferUsageBit::TransferSrc |
dawn::Buffer dst = device.CreateBuffer(&dstDesc);
std::array<uint32_t, kNumUints> zero{};
dst.SetSubData(0, sizeof(zero), reinterpret_cast<const uint8_t*>(;
auto dstView =
dst.CreateBufferViewBuilder().SetExtent(0, kNumUints * sizeof(uint32_t)).GetResult();
// Set up bind group and issue dispatch
auto bindGroup = device.CreateBindGroupBuilder()
.SetBufferViews(0, 1, &srcView)
.SetBufferViews(1, 1, &dstView)
auto commands = device.CreateCommandBufferBuilder()
.SetBindGroup(0, bindGroup)
.Dispatch(kInstances, 1, 1)
queue.Submit(1, &commands);
EXPECT_BUFFER_U32_RANGE_EQ(, dst, 0, kNumUints);
// Test that a trivial compute-shader memcpy implementation works.
// Each buffer is declared as a sized array of uvec4; one element is copied per invocation index.
TEST_P(ComputeCopyStorageBufferTests, SizedArrayOfBasic) {
    BasicTest(R"(
        #version 450
        #define kInstances 4
        layout(std140, set = 0, binding = 0) buffer Src { uvec4 s[kInstances]; } src;
        layout(std140, set = 0, binding = 1) buffer Dst { uvec4 s[kInstances]; } dst;
        void main() {
            uint index = gl_GlobalInvocationID.x;
            if (index >= kInstances) { return; }
            dst.s[index] = src.s[index];
        })");
}
// Test that a slightly-less-trivial compute-shader memcpy implementation works.
// Each buffer is declared as a sized array of structs (two uvec2 members) instead of uvec4.
TEST_P(ComputeCopyStorageBufferTests, SizedArrayOfStruct) {
    if (IsD3D12()) {
        // TODO: Fails on D3D12. Probably due to a limitation in SPIRV-Cross?
        std::cout << "Test skipped on D3D12" << std::endl;
        return;
    }

    BasicTest(R"(
        #version 450
        #define kInstances 4
        struct S {
            uvec2 a, b;  // kUintsPerInstance = 4
        };
        layout(std140, set = 0, binding = 0) buffer Src { S s[kInstances]; } src;
        layout(std140, set = 0, binding = 1) buffer Dst { S s[kInstances]; } dst;
        void main() {
            uint index = gl_GlobalInvocationID.x;
            if (index >= kInstances) { return; }
            dst.s[index] = src.s[index];
        })");
}
// Test that a trivial compute-shader memcpy implementation works when the buffers are declared
// as unsized (runtime-sized) arrays of uvec4.
TEST_P(ComputeCopyStorageBufferTests, UnsizedArrayOfBasic) {
    BasicTest(R"(
        #version 450
        #define kInstances 4
        layout(std140, set = 0, binding = 0) buffer Src { uvec4 s[]; } src;
        layout(std140, set = 0, binding = 1) buffer Dst { uvec4 s[]; } dst;
        void main() {
            uint index = gl_GlobalInvocationID.x;
            if (index >= kInstances) { return; }
            dst.s[index] = src.s[index];
        })");
}
// Test binding a sized array of SSBO descriptors.
//
// This is disabled because WebGPU doesn't currently have binding arrays (equivalent to
// VkDescriptorSetLayoutBinding::descriptorCount).
TEST_P(ComputeCopyStorageBufferTests, DISABLED_SizedDescriptorArray) {
    BasicTest(R"(
        #version 450
        #define kInstances 4
        struct S {
            uvec2 a, b;  // kUintsPerInstance = 4
        };
        layout(std140, set = 0, binding = 0) buffer Src { S s; } src[kInstances];
        layout(std140, set = 0, binding = 1) buffer Dst { S s; } dst[kInstances];
        void main() {
            uint index = gl_GlobalInvocationID.x;
            if (index >= kInstances) { return; }
            dst[index].s = src[index].s;
        })");
}
// Test binding an unsized array of SSBO descriptors.
//
// TODO: This test may be somewhat wrong. I'm not sure whether this is
// supposed to be possible on the various native APIs.
// Linking on OpenGL fails with "OpenGL requires constant indexes for unsized array access(dst)".
TEST_P(ComputeCopyStorageBufferTests, DISABLED_UnsizedDescriptorArray) {
    BasicTest(R"(
        #version 450
        #extension GL_EXT_nonuniform_qualifier : require
        #define kInstances 4
        struct S {
            uvec2 a, b;  // kUintsPerInstance = 4
        };
        layout(std140, set = 0, binding = 0) buffer Src { S s; } src[];
        layout(std140, set = 0, binding = 1) buffer Dst { S s; } dst[];
        void main() {
            uint index = gl_GlobalInvocationID.x;
            if (index >= kInstances) { return; }
            dst[index].s = src[index].s;
        })");
}