-
Notifications
You must be signed in to change notification settings - Fork 936
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
by injecting a compute shader that validates the content of the indirect buffer also adds missing indirect buffer offset validation
- Loading branch information
Showing
20 changed files
with
862 additions
and
21 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,197 @@ | ||
use wgpu_test::{gpu_test, FailureCase, GpuTestConfiguration, TestParameters, TestingContext}; | ||
|
||
/// Make sure that the num_workgroups builtin works properly (it requires a workaround on D3D12). | ||
#[gpu_test] | ||
static NUM_WORKGROUPS_BUILTIN: GpuTestConfiguration = GpuTestConfiguration::new() | ||
.parameters( | ||
TestParameters::default() | ||
.downlevel_flags( | ||
wgpu::DownlevelFlags::COMPUTE_SHADERS | wgpu::DownlevelFlags::INDIRECT_EXECUTION, | ||
) | ||
.limits(wgpu::Limits::downlevel_defaults()) | ||
.expect_fail(FailureCase::backend(wgt::Backends::DX12)), | ||
) | ||
.run_async(|ctx| async move { | ||
let num_workgroups = [1, 2, 3]; | ||
let res = run_test(&ctx, &num_workgroups, false).await; | ||
assert_eq!(res, num_workgroups); | ||
}); | ||
|
||
/// Make sure that we discard (don't run) the dispatch if its size exceeds the device limit. | ||
#[gpu_test] | ||
static DISCARD_DISPATCH: GpuTestConfiguration = GpuTestConfiguration::new() | ||
.parameters( | ||
TestParameters::default() | ||
.downlevel_flags( | ||
wgpu::DownlevelFlags::COMPUTE_SHADERS | wgpu::DownlevelFlags::INDIRECT_EXECUTION, | ||
) | ||
.limits(wgpu::Limits { | ||
max_compute_workgroups_per_dimension: 10, | ||
..wgpu::Limits::downlevel_defaults() | ||
}), | ||
) | ||
.run_async(|ctx| async move { | ||
let max = ctx.device.limits().max_compute_workgroups_per_dimension; | ||
|
||
let res = run_test(&ctx, &[max, max, max], false).await; | ||
assert_eq!(res, [max; 3]); | ||
|
||
let res = run_test(&ctx, &[max + 1, 1, 1], false).await; | ||
assert_eq!(res, [0; 3]); | ||
|
||
let res = run_test(&ctx, &[1, max + 1, 1], false).await; | ||
assert_eq!(res, [0; 3]); | ||
|
||
let res = run_test(&ctx, &[1, 1, max + 1], false).await; | ||
assert_eq!(res, [0; 3]); | ||
}); | ||
|
||
/// Make sure that unsetting the bind group set by the validation code works properly. | ||
#[gpu_test] | ||
static UNSET_INTERNAL_BIND_GROUP: GpuTestConfiguration = GpuTestConfiguration::new() | ||
.parameters( | ||
TestParameters::default() | ||
.downlevel_flags( | ||
wgpu::DownlevelFlags::COMPUTE_SHADERS | wgpu::DownlevelFlags::INDIRECT_EXECUTION, | ||
) | ||
.limits(wgpu::Limits::downlevel_defaults()), | ||
) | ||
.run_async(|ctx| async move { | ||
ctx.device.push_error_scope(wgpu::ErrorFilter::Validation); | ||
|
||
let _ = run_test(&ctx, &[0, 0, 0], true).await; | ||
|
||
let error = pollster::block_on(ctx.device.pop_error_scope()); | ||
assert!(error.map_or(false, |error| format!("{error}") | ||
.contains("Expected bind group is missing"))); | ||
}); | ||
|
||
async fn run_test( | ||
ctx: &TestingContext, | ||
num_workgroups: &[u32; 3], | ||
forget_to_set_bind_group: bool, | ||
) -> [u32; 3] { | ||
const SHADER_SRC: &str = " | ||
@group(0) @binding(0) | ||
var<storage, read_write> out: array<u32, 3>; | ||
@compute @workgroup_size(1) | ||
fn main(@builtin(num_workgroups) num_workgroups: vec3<u32>, @builtin(workgroup_id) workgroup_id: vec3<u32>) { | ||
if (all(workgroup_id == vec3<u32>())) { | ||
out[0] = num_workgroups.x; | ||
out[1] = num_workgroups.y; | ||
out[2] = num_workgroups.z; | ||
} | ||
} | ||
"; | ||
|
||
let module = ctx | ||
.device | ||
.create_shader_module(wgpu::ShaderModuleDescriptor { | ||
label: None, | ||
source: wgpu::ShaderSource::Wgsl(SHADER_SRC.into()), | ||
}); | ||
|
||
let pipeline = ctx | ||
.device | ||
.create_compute_pipeline(&wgpu::ComputePipelineDescriptor { | ||
label: None, | ||
layout: None, | ||
module: &module, | ||
entry_point: "main", | ||
compilation_options: Default::default(), | ||
cache: None, | ||
}); | ||
|
||
let out_buffer = ctx.device.create_buffer(&wgpu::BufferDescriptor { | ||
label: None, | ||
size: 12, | ||
usage: wgpu::BufferUsages::STORAGE | wgpu::BufferUsages::COPY_SRC, | ||
mapped_at_creation: false, | ||
}); | ||
|
||
let readback_buffer = ctx.device.create_buffer(&wgpu::BufferDescriptor { | ||
label: None, | ||
size: 12, | ||
usage: wgpu::BufferUsages::COPY_DST | wgpu::BufferUsages::MAP_READ, | ||
mapped_at_creation: false, | ||
}); | ||
|
||
let bind_group = ctx.device.create_bind_group(&wgpu::BindGroupDescriptor { | ||
label: None, | ||
layout: &pipeline.get_bind_group_layout(0), | ||
entries: &[wgpu::BindGroupEntry { | ||
binding: 0, | ||
resource: out_buffer.as_entire_binding(), | ||
}], | ||
}); | ||
|
||
let mut res = None; | ||
|
||
for (indirect_offset, indirect_buffer_size) in [ | ||
// internal src buffer binding size will be buffer.size | ||
(0, 12), | ||
(4, 4 + 12), | ||
(4, 8 + 12), | ||
(256 * 2 - 4 - 12, 256 * 2 - 4), | ||
// internal src buffer binding size will be 256 * 2 + x | ||
(0, 256 * 2 * 2 + 4), | ||
(256, 256 * 2 * 2 + 8), | ||
(256 + 4, 256 * 2 * 2 + 12), | ||
(256 * 2 + 16, 256 * 2 * 2 + 16), | ||
(256 * 2 * 2, 256 * 2 * 2 + 32), | ||
(256 + 12, 256 * 2 * 2 + 64), | ||
] { | ||
let indirect_buffer = ctx.device.create_buffer(&wgpu::BufferDescriptor { | ||
label: None, | ||
size: indirect_buffer_size, | ||
usage: wgpu::BufferUsages::COPY_DST | wgpu::BufferUsages::INDIRECT, | ||
mapped_at_creation: false, | ||
}); | ||
|
||
ctx.queue.write_buffer( | ||
&indirect_buffer, | ||
indirect_offset, | ||
bytemuck::bytes_of(num_workgroups), | ||
); | ||
|
||
let mut encoder = ctx | ||
.device | ||
.create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); | ||
{ | ||
let mut compute_pass = | ||
encoder.begin_compute_pass(&wgpu::ComputePassDescriptor::default()); | ||
compute_pass.set_pipeline(&pipeline); | ||
if !forget_to_set_bind_group { | ||
compute_pass.set_bind_group(0, &bind_group, &[]); | ||
} | ||
compute_pass.dispatch_workgroups_indirect(&indirect_buffer, indirect_offset); | ||
} | ||
|
||
encoder.copy_buffer_to_buffer(&out_buffer, 0, &readback_buffer, 0, 12); | ||
|
||
ctx.queue.submit(Some(encoder.finish())); | ||
|
||
readback_buffer | ||
.slice(..) | ||
.map_async(wgpu::MapMode::Read, |_| {}); | ||
|
||
ctx.async_poll(wgpu::Maintain::wait()) | ||
.await | ||
.panic_on_timeout(); | ||
|
||
let view = readback_buffer.slice(..).get_mapped_range(); | ||
|
||
let current_res = *bytemuck::from_bytes(&view); | ||
drop(view); | ||
readback_buffer.unmap(); | ||
|
||
if let Some(past_res) = res { | ||
assert_eq!(past_res, current_res); | ||
} else { | ||
res = Some(current_res); | ||
} | ||
} | ||
|
||
res.unwrap() | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.