From 55968e2dcc17682d1f5d7330ee35ecc7c980086d Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Mon, 10 Jun 2024 20:45:55 +0200 Subject: [PATCH 01/15] share timestamp write struct --- deno_webgpu/command_encoder.rs | 4 +- wgpu-core/src/command/compute.rs | 58 ++++++----------------- wgpu-core/src/command/mod.rs | 4 ++ wgpu-core/src/command/render.rs | 35 +++----------- wgpu-core/src/command/timestamp_writes.rs | 25 ++++++++++ wgpu-core/src/device/trace.rs | 4 +- wgpu/src/backend/wgpu_core.rs | 4 +- 7 files changed, 56 insertions(+), 78 deletions(-) create mode 100644 wgpu-core/src/command/timestamp_writes.rs diff --git a/deno_webgpu/command_encoder.rs b/deno_webgpu/command_encoder.rs index 552b084171..177cea28c7 100644 --- a/deno_webgpu/command_encoder.rs +++ b/deno_webgpu/command_encoder.rs @@ -186,7 +186,7 @@ pub fn op_webgpu_command_encoder_begin_render_pass( .get::(timestamp_writes.query_set)?; let query_set = query_set_resource.1; - Some(wgpu_core::command::RenderPassTimestampWrites { + Some(wgpu_core::command::PassTimestampWrites { query_set, beginning_of_pass_write_index: timestamp_writes.beginning_of_pass_write_index, end_of_pass_write_index: timestamp_writes.end_of_pass_write_index, @@ -245,7 +245,7 @@ pub fn op_webgpu_command_encoder_begin_compute_pass( .get::(timestamp_writes.query_set)?; let query_set = query_set_resource.1; - Some(wgpu_core::command::ComputePassTimestampWrites { + Some(wgpu_core::command::PassTimestampWrites { query_set, beginning_of_pass_write_index: timestamp_writes.beginning_of_pass_write_index, end_of_pass_write_index: timestamp_writes.end_of_pass_write_index, diff --git a/wgpu-core/src/command/compute.rs b/wgpu-core/src/command/compute.rs index 73b8838073..62e01b70e7 100644 --- a/wgpu-core/src/command/compute.rs +++ b/wgpu-core/src/command/compute.rs @@ -7,9 +7,9 @@ use crate::{ compute_command::{ArcComputeCommand, ComputeCommand}, end_pipeline_statistics_query, memory_init::{fixup_discarded_surfaces, SurfacesInDiscardState}, - validate_and_begin_pipeline_statistics_query, BasePass, BindGroupStateChange, - CommandBuffer, CommandEncoderError, CommandEncoderStatus, MapPassErr, PassErrorScope, - QueryUseError, StateChange, + validate_and_begin_pipeline_statistics_query, ArcPassTimestampWrites, BasePass, + BindGroupStateChange, CommandBuffer, CommandEncoderError, CommandEncoderStatus, MapPassErr, + PassErrorScope, PassTimestampWrites, QueryUseError, StateChange, }, device::{Device, DeviceError, MissingDownlevelFlags, MissingFeatures}, error::{ErrorFormatter, PrettyError}, @@ -28,10 +28,6 @@ use crate::{ }; use hal::CommandEncoder as _; -#[cfg(feature = "serde")] -use serde::Deserialize; -#[cfg(feature = "serde")] -use serde::Serialize; use thiserror::Error; use wgt::{BufferAddress, DynamicOffset}; @@ -53,7 +49,7 @@ pub struct ComputePass { /// If it is none, this pass is invalid and any operation on it will return an error. parent: Option>>, - timestamp_writes: Option>, + timestamp_writes: Option>, // Resource binding dedupe state. current_bind_groups: BindGroupStateChange, @@ -103,39 +99,17 @@ impl fmt::Debug for ComputePass { } } -/// Describes the writing of timestamp values in a compute pass. -#[derive(Clone, Debug, PartialEq, Eq)] -#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))] -pub struct ComputePassTimestampWrites { - /// The query set to write the timestamps to. - pub query_set: id::QuerySetId, - /// The index of the query set at which a start timestamp of this pass is written, if any. - pub beginning_of_pass_write_index: Option, - /// The index of the query set at which an end timestamp of this pass is written, if any. - pub end_of_pass_write_index: Option, -} - -/// Describes the writing of timestamp values in a compute pass with the query set resolved. -struct ArcComputePassTimestampWrites { - /// The query set to write the timestamps to. - pub query_set: Arc>, - /// The index of the query set at which a start timestamp of this pass is written, if any. - pub beginning_of_pass_write_index: Option, - /// The index of the query set at which an end timestamp of this pass is written, if any. - pub end_of_pass_write_index: Option, -} - #[derive(Clone, Debug, Default)] pub struct ComputePassDescriptor<'a> { pub label: Label<'a>, /// Defines where and when timestamp values will be written for this pass. - pub timestamp_writes: Option<&'a ComputePassTimestampWrites>, + pub timestamp_writes: Option<&'a PassTimestampWrites>, } struct ArcComputePassDescriptor<'a, A: HalApi> { pub label: &'a Label<'a>, /// Defines where and when timestamp values will be written for this pass. - pub timestamp_writes: Option>, + pub timestamp_writes: Option>, } #[derive(Clone, Debug, Error)] @@ -378,7 +352,7 @@ impl Global { return (ComputePass::new(None, arc_desc), Some(e.into())); } - Some(ArcComputePassTimestampWrites { + Some(ArcPassTimestampWrites { query_set, beginning_of_pass_write_index: tw.beginning_of_pass_write_index, end_of_pass_write_index: tw.end_of_pass_write_index, @@ -433,7 +407,7 @@ impl Global { &self, encoder_id: id::CommandEncoderId, base: BasePass, - timestamp_writes: Option<&ComputePassTimestampWrites>, + timestamp_writes: Option<&PassTimestampWrites>, ) -> Result<(), ComputePassError> { let hub = A::hub(self); let scope = PassErrorScope::PassEncoder(encoder_id); @@ -442,7 +416,7 @@ impl Global { let commands = ComputeCommand::resolve_compute_command_ids(A::hub(self), &base.commands)?; let timestamp_writes = if let Some(tw) = timestamp_writes { - Some(ArcComputePassTimestampWrites { + Some(ArcPassTimestampWrites { query_set: hub .query_sets .read() @@ -473,7 +447,7 @@ impl Global { &self, cmd_buf: &CommandBuffer, base: BasePass>, - mut timestamp_writes: Option>, + mut timestamp_writes: Option>, ) -> Result<(), ComputePassError> { profiling::scope!("CommandEncoder::run_compute_pass"); let pass_scope = PassErrorScope::Pass(Some(cmd_buf.as_info().id())); @@ -494,13 +468,11 @@ impl Global { string_data: base.string_data.to_vec(), push_constant_data: base.push_constant_data.to_vec(), }, - timestamp_writes: timestamp_writes - .as_ref() - .map(|tw| ComputePassTimestampWrites { - query_set: tw.query_set.as_info().id(), - beginning_of_pass_write_index: tw.beginning_of_pass_write_index, - end_of_pass_write_index: tw.end_of_pass_write_index, - }), + timestamp_writes: timestamp_writes.as_ref().map(|tw| PassTimestampWrites { + query_set: tw.query_set.as_info().id(), + beginning_of_pass_write_index: tw.beginning_of_pass_write_index, + end_of_pass_write_index: tw.end_of_pass_write_index, + }), }); } diff --git a/wgpu-core/src/command/mod.rs b/wgpu-core/src/command/mod.rs index 844691c7c2..26a7fcd302 100644 --- a/wgpu-core/src/command/mod.rs +++ b/wgpu-core/src/command/mod.rs @@ -10,6 +10,7 @@ mod memory_init; mod query; mod render; mod render_command; +mod timestamp_writes; mod transfer; use std::sync::Arc; @@ -22,6 +23,9 @@ pub use self::{ }; pub(crate) use allocator::CommandAllocator; +pub(crate) use timestamp_writes::ArcPassTimestampWrites; +pub use timestamp_writes::PassTimestampWrites; + use self::memory_init::CommandBufferTextureMemoryActions; use crate::device::{Device, DeviceError}; diff --git a/wgpu-core/src/command/render.rs b/wgpu-core/src/command/render.rs index 133bdad26e..39e61b10e1 100644 --- a/wgpu-core/src/command/render.rs +++ b/wgpu-core/src/command/render.rs @@ -57,7 +57,7 @@ use super::{ memory_init::TextureSurfaceDiscard, CommandBufferTextureMemoryActions, CommandEncoder, QueryResetMap, }; -use super::{DrawKind, Rect}; +use super::{DrawKind, PassTimestampWrites, Rect}; /// Operation to perform to the output attachment at the start of a renderpass. #[repr(C)] @@ -186,29 +186,6 @@ impl RenderPassDepthStencilAttachment { } } -/// Location to write a timestamp to (beginning or end of the pass). -#[repr(C)] -#[derive(Copy, Clone, Debug, Hash, Eq, PartialEq)] -#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))] -#[cfg_attr(feature = "serde", serde(rename_all = "kebab-case"))] -pub enum RenderPassTimestampLocation { - Beginning = 0, - End = 1, -} - -/// Describes the writing of timestamp values in a render pass. -#[repr(C)] -#[derive(Clone, Debug, PartialEq, Eq)] -#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))] -pub struct RenderPassTimestampWrites { - /// The query set to write the timestamp to. - pub query_set: id::QuerySetId, - /// The index of the query set at which a start timestamp of this pass is written, if any. - pub beginning_of_pass_write_index: Option, - /// The index of the query set at which an end timestamp of this pass is written, if any. - pub end_of_pass_write_index: Option, -} - /// Describes the attachments of a render pass. #[derive(Clone, Debug, Default, PartialEq)] pub struct RenderPassDescriptor<'a> { @@ -218,7 +195,7 @@ pub struct RenderPassDescriptor<'a> { /// The depth and stencil attachment of the render pass, if any. pub depth_stencil_attachment: Option<&'a RenderPassDepthStencilAttachment>, /// Defines where and when timestamp values will be written for this pass. - pub timestamp_writes: Option<&'a RenderPassTimestampWrites>, + pub timestamp_writes: Option<&'a PassTimestampWrites>, /// Defines where the occlusion query results will be stored for this pass. pub occlusion_query_set: Option, } @@ -235,7 +212,7 @@ pub struct RenderPass { parent_id: id::CommandEncoderId, color_targets: ArrayVec, { hal::MAX_COLOR_ATTACHMENTS }>, depth_stencil_target: Option, - timestamp_writes: Option, + timestamp_writes: Option, occlusion_query_set_id: Option, // Resource binding dedupe state. @@ -829,7 +806,7 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { hal_label: Option<&str>, color_attachments: &[Option], depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, - timestamp_writes: Option<&RenderPassTimestampWrites>, + timestamp_writes: Option<&PassTimestampWrites>, occlusion_query_set: Option>>, encoder: &mut CommandEncoder, trackers: &mut Tracker, @@ -1359,7 +1336,7 @@ impl Global { base: BasePass, color_attachments: &[Option], depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, - timestamp_writes: Option<&RenderPassTimestampWrites>, + timestamp_writes: Option<&PassTimestampWrites>, occlusion_query_set_id: Option, ) -> Result<(), RenderPassError> { let pass_scope = PassErrorScope::PassEncoder(encoder_id); @@ -1400,7 +1377,7 @@ impl Global { base: BasePass>, color_attachments: &[Option], depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, - timestamp_writes: Option<&RenderPassTimestampWrites>, + timestamp_writes: Option<&PassTimestampWrites>, occlusion_query_set: Option>>, ) -> Result<(), RenderPassError> { profiling::scope!( diff --git a/wgpu-core/src/command/timestamp_writes.rs b/wgpu-core/src/command/timestamp_writes.rs new file mode 100644 index 0000000000..82ab13c6dd --- /dev/null +++ b/wgpu-core/src/command/timestamp_writes.rs @@ -0,0 +1,25 @@ +use std::sync::Arc; + +use crate::{hal_api::HalApi, id}; + +/// Describes the writing of timestamp values in a render or compute pass. +#[derive(Clone, Debug, PartialEq, Eq)] +#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))] +pub struct PassTimestampWrites { + /// The query set to write the timestamps to. + pub query_set: id::QuerySetId, + /// The index of the query set at which a start timestamp of this pass is written, if any. + pub beginning_of_pass_write_index: Option, + /// The index of the query set at which an end timestamp of this pass is written, if any. + pub end_of_pass_write_index: Option, +} + +/// Describes the writing of timestamp values in a render or compute pass with the query set resolved. +pub struct ArcPassTimestampWrites { + /// The query set to write the timestamps to. + pub query_set: Arc>, + /// The index of the query set at which a start timestamp of this pass is written, if any. + pub beginning_of_pass_write_index: Option, + /// The index of the query set at which an end timestamp of this pass is written, if any. + pub end_of_pass_write_index: Option, +} diff --git a/wgpu-core/src/device/trace.rs b/wgpu-core/src/device/trace.rs index 24790103a5..ff4eea47be 100644 --- a/wgpu-core/src/device/trace.rs +++ b/wgpu-core/src/device/trace.rs @@ -179,13 +179,13 @@ pub enum Command { InsertDebugMarker(String), RunComputePass { base: crate::command::BasePass, - timestamp_writes: Option, + timestamp_writes: Option, }, RunRenderPass { base: crate::command::BasePass, target_colors: Vec>, target_depth_stencil: Option, - timestamp_writes: Option, + timestamp_writes: Option, occlusion_query_set_id: Option, }, } diff --git a/wgpu/src/backend/wgpu_core.rs b/wgpu/src/backend/wgpu_core.rs index 57574d8abb..e002b2f257 100644 --- a/wgpu/src/backend/wgpu_core.rs +++ b/wgpu/src/backend/wgpu_core.rs @@ -1913,7 +1913,7 @@ impl crate::Context for ContextWgpuCore { let timestamp_writes = desc.timestamp_writes .as_ref() - .map(|tw| wgc::command::ComputePassTimestampWrites { + .map(|tw| wgc::command::PassTimestampWrites { query_set: tw.query_set.id.into(), beginning_of_pass_write_index: tw.beginning_of_pass_write_index, end_of_pass_write_index: tw.end_of_pass_write_index, @@ -1982,7 +1982,7 @@ impl crate::Context for ContextWgpuCore { let timestamp_writes = desc.timestamp_writes .as_ref() - .map(|tw| wgc::command::RenderPassTimestampWrites { + .map(|tw| wgc::command::PassTimestampWrites { query_set: tw.query_set.id.into(), beginning_of_pass_write_index: tw.beginning_of_pass_write_index, end_of_pass_write_index: tw.end_of_pass_write_index, From 5e36ab10d88d816750f27502f40305671c867350 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sat, 29 Jun 2024 13:30:17 +0200 Subject: [PATCH 02/15] Make name of set_push_constants methods consistently plural --- wgpu-core/src/command/compute.rs | 2 +- wgpu-core/src/command/dyn_compute_pass.rs | 6 +++--- wgpu/src/backend/wgpu_core.rs | 2 +- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/wgpu-core/src/command/compute.rs b/wgpu-core/src/command/compute.rs index 62e01b70e7..b5abe6f34e 100644 --- a/wgpu-core/src/command/compute.rs +++ b/wgpu-core/src/command/compute.rs @@ -1076,7 +1076,7 @@ impl Global { Ok(()) } - pub fn compute_pass_set_push_constant( + pub fn compute_pass_set_push_constants( &self, pass: &mut ComputePass, offset: u32, diff --git a/wgpu-core/src/command/dyn_compute_pass.rs b/wgpu-core/src/command/dyn_compute_pass.rs index 0b602b1dbd..ea15e2667d 100644 --- a/wgpu-core/src/command/dyn_compute_pass.rs +++ b/wgpu-core/src/command/dyn_compute_pass.rs @@ -21,7 +21,7 @@ pub trait DynComputePass: std::fmt::Debug + WasmNotSendSync { context: &global::Global, pipeline_id: id::ComputePipelineId, ) -> Result<(), ComputePassError>; - fn set_push_constant( + fn set_push_constants( &mut self, context: &global::Global, offset: u32, @@ -93,13 +93,13 @@ impl DynComputePass for ComputePass { context.compute_pass_set_pipeline(self, pipeline_id) } - fn set_push_constant( + fn set_push_constants( &mut self, context: &global::Global, offset: u32, data: &[u8], ) -> Result<(), ComputePassError> { - context.compute_pass_set_push_constant(self, offset, data) + context.compute_pass_set_push_constants(self, offset, data) } fn dispatch_workgroups( diff --git a/wgpu/src/backend/wgpu_core.rs b/wgpu/src/backend/wgpu_core.rs index e002b2f257..e663f099c4 100644 --- a/wgpu/src/backend/wgpu_core.rs +++ b/wgpu/src/backend/wgpu_core.rs @@ -2438,7 +2438,7 @@ impl crate::Context for ContextWgpuCore { offset: u32, data: &[u8], ) { - if let Err(cause) = pass_data.pass.set_push_constant(&self.0, offset, data) { + if let Err(cause) = pass_data.pass.set_push_constants(&self.0, offset, data) { self.handle_error( &pass_data.error_sink, cause, From bb76e15d2e74a5e43694668f73f9ac0ec56e31d8 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Mon, 10 Jun 2024 15:58:33 +0200 Subject: [PATCH 03/15] remove lifetime bounds of resources passed into render pass --- wgpu/src/backend/webgpu.rs | 2 +- wgpu/src/backend/wgpu_core.rs | 2 +- wgpu/src/context.rs | 6 ++-- wgpu/src/lib.rs | 68 +++++++++++++++++------------------ 4 files changed, 39 insertions(+), 39 deletions(-) diff --git a/wgpu/src/backend/webgpu.rs b/wgpu/src/backend/webgpu.rs index fc727003a7..8e158359c2 100644 --- a/wgpu/src/backend/webgpu.rs +++ b/wgpu/src/backend/webgpu.rs @@ -2570,7 +2570,7 @@ impl crate::context::Context for ContextWebGpu { &self, _encoder: &Self::CommandEncoderId, encoder_data: &Self::CommandEncoderData, - desc: &crate::RenderPassDescriptor<'_, '_>, + desc: &crate::RenderPassDescriptor<'_>, ) -> (Self::RenderPassId, Self::RenderPassData) { let mapped_color_attachments = desc .color_attachments diff --git a/wgpu/src/backend/wgpu_core.rs b/wgpu/src/backend/wgpu_core.rs index e663f099c4..3dbbd92d21 100644 --- a/wgpu/src/backend/wgpu_core.rs +++ b/wgpu/src/backend/wgpu_core.rs @@ -1947,7 +1947,7 @@ impl crate::Context for ContextWgpuCore { &self, encoder: &Self::CommandEncoderId, encoder_data: &Self::CommandEncoderData, - desc: &crate::RenderPassDescriptor<'_, '_>, + desc: &crate::RenderPassDescriptor<'_>, ) -> (Self::RenderPassId, Self::RenderPassData) { if desc.color_attachments.len() > wgc::MAX_COLOR_ATTACHMENTS { self.handle_error_fatal( diff --git a/wgpu/src/context.rs b/wgpu/src/context.rs index cba2dbb14e..7ff2adbaf7 100644 --- a/wgpu/src/context.rs +++ b/wgpu/src/context.rs @@ -470,7 +470,7 @@ pub trait Context: Debug + WasmNotSendSync + Sized { &self, encoder: &Self::CommandEncoderId, encoder_data: &Self::CommandEncoderData, - desc: &RenderPassDescriptor<'_, '_>, + desc: &RenderPassDescriptor<'_>, ) -> (Self::RenderPassId, Self::RenderPassData); fn command_encoder_finish( &self, @@ -1477,7 +1477,7 @@ pub(crate) trait DynContext: Debug + WasmNotSendSync { &self, encoder: &ObjectId, encoder_data: &crate::Data, - desc: &RenderPassDescriptor<'_, '_>, + desc: &RenderPassDescriptor<'_>, ) -> (ObjectId, Box); fn command_encoder_finish( &self, @@ -2799,7 +2799,7 @@ where &self, encoder: &ObjectId, encoder_data: &crate::Data, - desc: &RenderPassDescriptor<'_, '_>, + desc: &RenderPassDescriptor<'_>, ) -> (ObjectId, Box) { let encoder = ::from(*encoder); let encoder_data = downcast_ref(encoder_data); diff --git a/wgpu/src/lib.rs b/wgpu/src/lib.rs index 6670716c8b..6b44f08a8e 100644 --- a/wgpu/src/lib.rs +++ b/wgpu/src/lib.rs @@ -1273,10 +1273,10 @@ impl Drop for CommandEncoder { /// Corresponds to [WebGPU `GPURenderPassEncoder`]( /// https://gpuweb.github.io/gpuweb/#render-pass-encoder). #[derive(Debug)] -pub struct RenderPass<'a> { +pub struct RenderPass<'encoder> { id: ObjectId, data: Box, - parent: &'a mut CommandEncoder, + parent: &'encoder mut CommandEncoder, } /// In-progress recording of a compute pass. @@ -1825,28 +1825,25 @@ static_assertions::assert_impl_all!(BindGroupDescriptor<'_>: Send, Sync); /// /// For use with [`CommandEncoder::begin_render_pass`]. /// -/// Note: separate lifetimes are needed because the texture views (`'tex`) -/// have to live as long as the pass is recorded, while everything else (`'desc`) doesn't. -/// /// Corresponds to [WebGPU `GPURenderPassDescriptor`]( /// https://gpuweb.github.io/gpuweb/#dictdef-gpurenderpassdescriptor). #[derive(Clone, Debug, Default)] -pub struct RenderPassDescriptor<'tex, 'desc> { +pub struct RenderPassDescriptor<'a> { /// Debug label of the render pass. This will show up in graphics debuggers for easy identification. - pub label: Label<'desc>, + pub label: Label<'a>, /// The color attachments of the render pass. - pub color_attachments: &'desc [Option>], + pub color_attachments: &'a [Option>], /// The depth and stencil attachment of the render pass, if any. - pub depth_stencil_attachment: Option>, + pub depth_stencil_attachment: Option>, /// Defines which timestamp values will be written for this pass, and where to write them to. /// /// Requires [`Features::TIMESTAMP_QUERY`] to be enabled. - pub timestamp_writes: Option>, + pub timestamp_writes: Option>, /// Defines where the occlusion query results will be stored for this pass. - pub occlusion_query_set: Option<&'tex QuerySet>, + pub occlusion_query_set: Option<&'a QuerySet>, } #[cfg(send_sync)] -static_assertions::assert_impl_all!(RenderPassDescriptor<'_, '_>: Send, Sync); +static_assertions::assert_impl_all!(RenderPassDescriptor<'_>: Send, Sync); /// Describes how the vertex buffer is interpreted. /// @@ -3892,10 +3889,10 @@ impl CommandEncoder { // See https://github.com/gfx-rs/wgpu/pull/5768 for details // Once this is done, the documentation for `begin_render_pass` and `begin_compute_pass` should // be nearly identical. - pub fn begin_render_pass<'pass>( - &'pass mut self, - desc: &RenderPassDescriptor<'pass, '_>, - ) -> RenderPass<'pass> { + pub fn begin_render_pass<'encoder>( + &'encoder mut self, + desc: &RenderPassDescriptor<'_>, + ) -> RenderPass<'encoder> { let id = self.id.as_ref().unwrap(); let (id, data) = DynContext::command_encoder_begin_render_pass( &*self.context, @@ -4177,7 +4174,7 @@ impl CommandEncoder { } } -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Sets the active bind group for a given bind group index. The bind group layout /// in the active pipeline when any `draw_*()` method is called must match the layout of /// this bind group. @@ -4190,7 +4187,7 @@ impl<'a> RenderPass<'a> { pub fn set_bind_group( &mut self, index: u32, - bind_group: &'a BindGroup, + bind_group: &BindGroup, offsets: &[DynamicOffset], ) { DynContext::render_pass_set_bind_group( @@ -4207,7 +4204,7 @@ impl<'a> RenderPass<'a> { /// Sets the active render pipeline. /// /// Subsequent draw calls will exhibit the behavior defined by `pipeline`. - pub fn set_pipeline(&mut self, pipeline: &'a RenderPipeline) { + pub fn set_pipeline(&mut self, pipeline: &RenderPipeline) { DynContext::render_pass_set_pipeline( &*self.parent.context, &mut self.id, @@ -4235,7 +4232,7 @@ impl<'a> RenderPass<'a> { /// /// Subsequent calls to [`draw_indexed`](RenderPass::draw_indexed) on this [`RenderPass`] will /// use `buffer` as the source index buffer. - pub fn set_index_buffer(&mut self, buffer_slice: BufferSlice<'a>, index_format: IndexFormat) { + pub fn set_index_buffer(&mut self, buffer_slice: BufferSlice<'_>, index_format: IndexFormat) { DynContext::render_pass_set_index_buffer( &*self.parent.context, &mut self.id, @@ -4258,7 +4255,7 @@ impl<'a> RenderPass<'a> { /// /// [`draw`]: RenderPass::draw /// [`draw_indexed`]: RenderPass::draw_indexed - pub fn set_vertex_buffer(&mut self, slot: u32, buffer_slice: BufferSlice<'a>) { + pub fn set_vertex_buffer(&mut self, slot: u32, buffer_slice: BufferSlice<'_>) { DynContext::render_pass_set_vertex_buffer( &*self.parent.context, &mut self.id, @@ -4433,7 +4430,7 @@ impl<'a> RenderPass<'a> { /// any use of `@builtin(vertex_index)` or `@builtin(instance_index)` in the vertex shader will have different values. /// /// See details on the individual flags for more information. - pub fn draw_indirect(&mut self, indirect_buffer: &'a Buffer, indirect_offset: BufferAddress) { + pub fn draw_indirect(&mut self, indirect_buffer: &Buffer, indirect_offset: BufferAddress) { DynContext::render_pass_draw_indirect( &*self.parent.context, &mut self.id, @@ -4460,7 +4457,7 @@ impl<'a> RenderPass<'a> { /// See details on the individual flags for more information. pub fn draw_indexed_indirect( &mut self, - indirect_buffer: &'a Buffer, + indirect_buffer: &Buffer, indirect_offset: BufferAddress, ) { DynContext::render_pass_draw_indexed_indirect( @@ -4478,7 +4475,10 @@ impl<'a> RenderPass<'a> { /// /// Commands in the bundle do not inherit this render pass's current render state, and after the /// bundle has executed, the state is **cleared** (reset to defaults, not the previous state). - pub fn execute_bundles>(&mut self, render_bundles: I) { + pub fn execute_bundles<'a, I: IntoIterator>( + &mut self, + render_bundles: I, + ) { let mut render_bundles = render_bundles .into_iter() .map(|rb| (&rb.id, rb.data.as_ref())); @@ -4506,7 +4506,7 @@ impl<'a> RenderPass<'a> { /// It is not affected by changes to the state that are performed after it is called. pub fn multi_draw_indirect( &mut self, - indirect_buffer: &'a Buffer, + indirect_buffer: &Buffer, indirect_offset: BufferAddress, count: u32, ) { @@ -4534,7 +4534,7 @@ impl<'a> RenderPass<'a> { /// It is not affected by changes to the state that are performed after it is called. pub fn multi_draw_indexed_indirect( &mut self, - indirect_buffer: &'a Buffer, + indirect_buffer: &Buffer, indirect_offset: BufferAddress, count: u32, ) { @@ -4551,7 +4551,7 @@ impl<'a> RenderPass<'a> { } /// [`Features::MULTI_DRAW_INDIRECT_COUNT`] must be enabled on the device in order to call these functions. -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Dispatches multiple draw calls from the active vertex buffer(s) based on the contents of the `indirect_buffer`. /// The count buffer is read to determine how many draws to issue. /// @@ -4576,9 +4576,9 @@ impl<'a> RenderPass<'a> { /// It is not affected by changes to the state that are performed after it is called. pub fn multi_draw_indirect_count( &mut self, - indirect_buffer: &'a Buffer, + indirect_buffer: &Buffer, indirect_offset: BufferAddress, - count_buffer: &'a Buffer, + count_buffer: &Buffer, count_offset: BufferAddress, max_count: u32, ) { @@ -4623,9 +4623,9 @@ impl<'a> RenderPass<'a> { /// It is not affected by changes to the state that are performed after it is called. pub fn multi_draw_indexed_indirect_count( &mut self, - indirect_buffer: &'a Buffer, + indirect_buffer: &Buffer, indirect_offset: BufferAddress, - count_buffer: &'a Buffer, + count_buffer: &Buffer, count_offset: BufferAddress, max_count: u32, ) { @@ -4645,7 +4645,7 @@ impl<'a> RenderPass<'a> { } /// [`Features::PUSH_CONSTANTS`] must be enabled on the device in order to call these functions. -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Set push constant data for subsequent draw calls. /// /// Write the bytes in `data` at offset `offset` within push constant @@ -4699,7 +4699,7 @@ impl<'a> RenderPass<'a> { } /// [`Features::TIMESTAMP_QUERY_INSIDE_PASSES`] must be enabled on the device in order to call these functions. -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Issue a timestamp command at this point in the queue. The /// timestamp will be written to the specified query set, at the specified index. /// @@ -4768,7 +4768,7 @@ impl<'a> RenderPass<'a> { } } -impl<'a> Drop for RenderPass<'a> { +impl<'encoder> Drop for RenderPass<'encoder> { fn drop(&mut self) { if !thread::panicking() { self.parent From 25b03ace1dd9ccfa94034fd90c44823d8bf08675 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Mon, 10 Jun 2024 16:02:12 +0200 Subject: [PATCH 04/15] first render pass resource ownership test --- tests/tests/render_pass_ownership.rs | 305 +++++++++++++++++++++++++++ tests/tests/root.rs | 1 + 2 files changed, 306 insertions(+) create mode 100644 tests/tests/render_pass_ownership.rs diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs new file mode 100644 index 0000000000..192bbad7bb --- /dev/null +++ b/tests/tests/render_pass_ownership.rs @@ -0,0 +1,305 @@ +//! Tests that render passes take ownership of resources that are associated with. +//! I.e. once a resource is passed in to a render pass, it can be dropped. +//! +//! TODO: Methods that take resources that weren't tested here: +//! * rpass.set_index_buffer(buffer_slice, index_format) +//! * rpass.set_vertex_buffer(slot, buffer_slice) +//! * rpass.draw_indexed_indirect(indirect_buffer, indirect_offset) +//! * rpass.execute_bundles(render_bundles) +//! * rpass.multi_draw_indirect(indirect_buffer, indirect_offset, count) +//! * rpass.multi_draw_indexed_indirect(indirect_buffer, indirect_offset, count) +//! * rpass.multi_draw_indirect_count +//! * rpass.multi_draw_indexed_indirect_count +//! * rpass.begin_pipeline_statistics_query +//! * rpass.write_timestamp + +use std::num::NonZeroU64; + +use wgpu::util::DeviceExt as _; +use wgpu_test::{gpu_test, GpuTestConfiguration, TestParameters, TestingContext}; + +// Minimal shader with buffer based side effect - only needed to check whether the render pass has executed at all. +const SHADER_SRC: &str = " +@group(0) @binding(0) +var buffer: array; + +var positions: array = array( + vec2f(-1.0, -3.0), + vec2f(-1.0, 1.0), + vec2f(3.0, 1.0) +); + +@vertex +fn vs_main(@builtin(vertex_index) vertex_index: u32) -> @builtin(position) vec4 { + return vec4f(positions[vertex_index], 0.0, 1.0); +} + +@fragment +fn fs_main() -> @location(0) vec4 { + buffer[0] *= 2.0; + return vec4(1.0, 0.0, 1.0, 1.0); +}"; + +#[gpu_test] +static RENDER_PASS_RESOURCE_OWNERSHIP: GpuTestConfiguration = GpuTestConfiguration::new() + .parameters(TestParameters::default().test_features_limits()) + .run_async(render_pass_resource_ownership); + +async fn render_pass_resource_ownership(ctx: TestingContext) { + let ResourceSetup { + gpu_buffer, + cpu_buffer, + buffer_size, + indirect_buffer, + bind_group, + pipeline, + color_attachment_view, + color_attachment_resolve_view, + depth_stencil_view, + } = resource_setup(&ctx); + + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + + { + let mut rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { + label: Some("render_pass"), + color_attachments: &[Some(wgpu::RenderPassColorAttachment { + view: &color_attachment_view, + resolve_target: Some(&color_attachment_resolve_view), + ops: wgpu::Operations::default(), + })], + depth_stencil_attachment: Some(wgpu::RenderPassDepthStencilAttachment { + view: &depth_stencil_view, + depth_ops: Some(wgpu::Operations { + load: wgpu::LoadOp::Clear(1.0), + store: wgpu::StoreOp::Store, + }), + stencil_ops: None, + }), + timestamp_writes: None, + occlusion_query_set: None, + }); + + // Drop render pass attachments right away. + drop(color_attachment_view); + drop(color_attachment_resolve_view); + drop(depth_stencil_view); + + rpass.set_pipeline(&pipeline); + rpass.set_bind_group(0, &bind_group, &[]); + rpass.draw_indirect(&indirect_buffer, 0); + + // Now drop all resources we set. Then do a device poll to make sure the resources are really not dropped too early, no matter what. + drop(pipeline); + drop(bind_group); + drop(indirect_buffer); + ctx.async_poll(wgpu::Maintain::wait()) + .await + .panic_on_timeout(); + } + + assert_render_pass_executed_normally(encoder, gpu_buffer, cpu_buffer, buffer_size, ctx).await; +} + +async fn assert_render_pass_executed_normally( + mut encoder: wgpu::CommandEncoder, + gpu_buffer: wgpu::Buffer, + cpu_buffer: wgpu::Buffer, + buffer_size: u64, + ctx: TestingContext, +) { + encoder.copy_buffer_to_buffer(&gpu_buffer, 0, &cpu_buffer, 0, buffer_size); + ctx.queue.submit([encoder.finish()]); + cpu_buffer.slice(..).map_async(wgpu::MapMode::Read, |_| ()); + ctx.async_poll(wgpu::Maintain::wait()) + .await + .panic_on_timeout(); + + let data = cpu_buffer.slice(..).get_mapped_range(); + + let floats: &[f32] = bytemuck::cast_slice(&data); + assert!(floats[0] >= 2.0); + assert!(floats[1] >= 4.0); + assert!(floats[2] >= 6.0); + assert!(floats[3] >= 8.0); +} + +// Setup ------------------------------------------------------------ + +struct ResourceSetup { + gpu_buffer: wgpu::Buffer, + cpu_buffer: wgpu::Buffer, + buffer_size: u64, + + indirect_buffer: wgpu::Buffer, + bind_group: wgpu::BindGroup, + pipeline: wgpu::RenderPipeline, + + color_attachment_view: wgpu::TextureView, + color_attachment_resolve_view: wgpu::TextureView, + depth_stencil_view: wgpu::TextureView, +} + +fn resource_setup(ctx: &TestingContext) -> ResourceSetup { + let sm = ctx + .device + .create_shader_module(wgpu::ShaderModuleDescriptor { + label: Some("shader"), + source: wgpu::ShaderSource::Wgsl(SHADER_SRC.into()), + }); + + let buffer_size = 4 * std::mem::size_of::() as u64; + + let bgl = ctx + .device + .create_bind_group_layout(&wgpu::BindGroupLayoutDescriptor { + label: Some("bind_group_layout"), + entries: &[wgpu::BindGroupLayoutEntry { + binding: 0, + visibility: wgpu::ShaderStages::FRAGMENT, + ty: wgpu::BindingType::Buffer { + ty: wgpu::BufferBindingType::Storage { read_only: false }, + has_dynamic_offset: false, + min_binding_size: NonZeroU64::new(buffer_size), + }, + count: None, + }], + }); + + let gpu_buffer = ctx + .device + .create_buffer_init(&wgpu::util::BufferInitDescriptor { + label: Some("gpu_buffer"), + usage: wgpu::BufferUsages::STORAGE | wgpu::BufferUsages::COPY_SRC, + contents: bytemuck::bytes_of(&[1.0_f32, 2.0, 3.0, 4.0]), + }); + + let cpu_buffer = ctx.device.create_buffer(&wgpu::BufferDescriptor { + label: Some("cpu_buffer"), + size: buffer_size, + usage: wgpu::BufferUsages::COPY_DST | wgpu::BufferUsages::MAP_READ, + mapped_at_creation: false, + }); + + let indirect_buffer = ctx + .device + .create_buffer_init(&wgpu::util::BufferInitDescriptor { + label: Some("gpu_buffer"), + usage: wgpu::BufferUsages::INDIRECT, + contents: wgpu::util::DrawIndirectArgs { + vertex_count: 3, + instance_count: 1, + first_vertex: 0, + first_instance: 0, + } + .as_bytes(), + }); + + let bind_group = ctx.device.create_bind_group(&wgpu::BindGroupDescriptor { + label: Some("bind_group"), + layout: &bgl, + entries: &[wgpu::BindGroupEntry { + binding: 0, + resource: gpu_buffer.as_entire_binding(), + }], + }); + + let pipeline_layout = ctx + .device + .create_pipeline_layout(&wgpu::PipelineLayoutDescriptor { + label: Some("pipeline_layout"), + bind_group_layouts: &[&bgl], + push_constant_ranges: &[], + }); + + let target_size = wgpu::Extent3d { + width: 4, + height: 4, + depth_or_array_layers: 1, + }; + let target_msaa = 4; + let target_format = wgpu::TextureFormat::Bgra8UnormSrgb; + + let target_desc = wgpu::TextureDescriptor { + label: Some("target_tex"), + size: target_size, + mip_level_count: 1, + sample_count: target_msaa, + dimension: wgpu::TextureDimension::D2, + format: target_format, + usage: wgpu::TextureUsages::RENDER_ATTACHMENT, + view_formats: &[target_format], + }; + let target_tex = ctx.device.create_texture(&target_desc); + let target_tex_resolve = ctx.device.create_texture(&wgpu::TextureDescriptor { + label: Some("target_resolve"), + sample_count: 1, + ..target_desc + }); + + let color_attachment_view = target_tex.create_view(&wgpu::TextureViewDescriptor::default()); + let color_attachment_resolve_view = + target_tex_resolve.create_view(&wgpu::TextureViewDescriptor::default()); + + let depth_stencil_format = wgpu::TextureFormat::Depth32Float; + let depth_stencil = ctx.device.create_texture(&wgpu::TextureDescriptor { + label: Some("depth_stencil"), + format: depth_stencil_format, + view_formats: &[depth_stencil_format], + ..target_desc + }); + let depth_stencil_view = depth_stencil.create_view(&wgpu::TextureViewDescriptor::default()); + + let pipeline = ctx + .device + .create_render_pipeline(&wgpu::RenderPipelineDescriptor { + label: Some("pipeline"), + layout: Some(&pipeline_layout), + vertex: wgpu::VertexState { + module: &sm, + entry_point: "vs_main", + compilation_options: Default::default(), + buffers: &[], + }, + fragment: Some(wgpu::FragmentState { + module: &sm, + entry_point: "fs_main", + compilation_options: Default::default(), + targets: &[Some(target_format.into())], + }), + primitive: wgpu::PrimitiveState { + topology: wgpu::PrimitiveTopology::TriangleStrip, + strip_index_format: Some(wgpu::IndexFormat::Uint32), + ..Default::default() + }, + depth_stencil: Some(wgpu::DepthStencilState { + format: depth_stencil_format, + depth_write_enabled: true, + depth_compare: wgpu::CompareFunction::LessEqual, + stencil: wgpu::StencilState::default(), + bias: wgpu::DepthBiasState::default(), + }), + multisample: wgpu::MultisampleState { + count: target_msaa, + mask: !0, + alpha_to_coverage_enabled: false, + }, + multiview: None, + cache: None, + }); + + ResourceSetup { + gpu_buffer, + cpu_buffer, + buffer_size, + indirect_buffer, + bind_group, + pipeline, + + color_attachment_view, + color_attachment_resolve_view, + depth_stencil_view, + } +} diff --git a/tests/tests/root.rs b/tests/tests/root.rs index 1cb5b56c7c..159c22d046 100644 --- a/tests/tests/root.rs +++ b/tests/tests/root.rs @@ -29,6 +29,7 @@ mod poll; mod push_constants; mod query_set; mod queue_transfer; +mod render_pass_ownership; mod resource_descriptor_accessor; mod resource_error; mod scissor_tests; From 733121deb2bb0d3a3e88b7b89d4ebd35d4519cd2 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 16 Jun 2024 11:06:59 +0200 Subject: [PATCH 05/15] introduce dynrenderpass & immediately create ArcCommands and take ownership of resources passed on pass creation --- wgpu-core/src/command/compute.rs | 4 +- wgpu-core/src/command/dyn_render_pass.rs | 458 ++++++++++++ wgpu-core/src/command/mod.rs | 34 +- wgpu-core/src/command/render.rs | 873 +++++++++++++++-------- wgpu-core/src/device/mod.rs | 9 - wgpu/src/backend/wgpu_core.rs | 196 +++-- 6 files changed, 1150 insertions(+), 424 deletions(-) create mode 100644 wgpu-core/src/command/dyn_render_pass.rs diff --git a/wgpu-core/src/command/compute.rs b/wgpu-core/src/command/compute.rs index b5abe6f34e..36b2413e68 100644 --- a/wgpu-core/src/command/compute.rs +++ b/wgpu-core/src/command/compute.rs @@ -344,7 +344,9 @@ impl Global { let Ok(query_set) = hub.query_sets.read().get_owned(tw.query_set) else { return ( ComputePass::new(None, arc_desc), - Some(CommandEncoderError::InvalidTimestampWritesQuerySetId), + Some(CommandEncoderError::InvalidTimestampWritesQuerySetId( + tw.query_set, + )), ); }; diff --git a/wgpu-core/src/command/dyn_render_pass.rs b/wgpu-core/src/command/dyn_render_pass.rs new file mode 100644 index 0000000000..7ad79262b3 --- /dev/null +++ b/wgpu-core/src/command/dyn_render_pass.rs @@ -0,0 +1,458 @@ +use wgt::WasmNotSendSync; + +use crate::{global, hal_api::HalApi, id}; + +use super::{RenderPass, RenderPassError}; + +/// Trait for type erasing RenderPass. +// TODO(#5124): wgpu-core's RenderPass trait should not be hal type dependent. +// Practically speaking this allows us merge gfx_select with type erasure: +// The alternative would be to introduce RenderPassId which then first needs to be looked up and then dispatch via gfx_select. +pub trait DynRenderPass: std::fmt::Debug + WasmNotSendSync { + fn set_bind_group( + &mut self, + context: &global::Global, + index: u32, + bind_group_id: id::BindGroupId, + offsets: &[wgt::DynamicOffset], + ) -> Result<(), RenderPassError>; + fn set_index_buffer( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + index_format: wgt::IndexFormat, + offset: wgt::BufferAddress, + size: Option, + ) -> Result<(), RenderPassError>; + fn set_vertex_buffer( + &mut self, + context: &global::Global, + slot: u32, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + size: Option, + ) -> Result<(), RenderPassError>; + fn set_pipeline( + &mut self, + context: &global::Global, + pipeline_id: id::RenderPipelineId, + ) -> Result<(), RenderPassError>; + fn set_push_constants( + &mut self, + context: &global::Global, + stages: wgt::ShaderStages, + offset: u32, + data: &[u8], + ) -> Result<(), RenderPassError>; + fn draw( + &mut self, + context: &global::Global, + vertex_count: u32, + instance_count: u32, + first_vertex: u32, + first_instance: u32, + ) -> Result<(), RenderPassError>; + fn draw_indexed( + &mut self, + context: &global::Global, + index_count: u32, + instance_count: u32, + first_index: u32, + base_vertex: i32, + first_instance: u32, + ) -> Result<(), RenderPassError>; + fn draw_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + ) -> Result<(), RenderPassError>; + fn draw_indexed_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + ) -> Result<(), RenderPassError>; + fn multi_draw_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count: u32, + ) -> Result<(), RenderPassError>; + fn multi_draw_indexed_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count: u32, + ) -> Result<(), RenderPassError>; + fn multi_draw_indirect_count( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count_buffer_id: id::BufferId, + count_buffer_offset: wgt::BufferAddress, + max_count: u32, + ) -> Result<(), RenderPassError>; + fn multi_draw_indexed_indirect_count( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count_buffer_id: id::BufferId, + count_buffer_offset: wgt::BufferAddress, + max_count: u32, + ) -> Result<(), RenderPassError>; + fn set_blend_constant( + &mut self, + context: &global::Global, + color: wgt::Color, + ) -> Result<(), RenderPassError>; + fn set_scissor_rect( + &mut self, + context: &global::Global, + x: u32, + y: u32, + width: u32, + height: u32, + ) -> Result<(), RenderPassError>; + fn set_viewport( + &mut self, + context: &global::Global, + x: f32, + y: f32, + width: f32, + height: f32, + min_depth: f32, + max_depth: f32, + ) -> Result<(), RenderPassError>; + fn set_stencil_reference( + &mut self, + context: &global::Global, + reference: u32, + ) -> Result<(), RenderPassError>; + fn push_debug_group( + &mut self, + context: &global::Global, + label: &str, + color: u32, + ) -> Result<(), RenderPassError>; + fn pop_debug_group(&mut self, context: &global::Global) -> Result<(), RenderPassError>; + fn insert_debug_marker( + &mut self, + context: &global::Global, + label: &str, + color: u32, + ) -> Result<(), RenderPassError>; + fn write_timestamp( + &mut self, + context: &global::Global, + query_set_id: id::QuerySetId, + query_index: u32, + ) -> Result<(), RenderPassError>; + fn begin_occlusion_query( + &mut self, + context: &global::Global, + query_index: u32, + ) -> Result<(), RenderPassError>; + fn end_occlusion_query(&mut self, context: &global::Global) -> Result<(), RenderPassError>; + fn begin_pipeline_statistics_query( + &mut self, + context: &global::Global, + query_set_id: id::QuerySetId, + query_index: u32, + ) -> Result<(), RenderPassError>; + fn end_pipeline_statistics_query( + &mut self, + context: &global::Global, + ) -> Result<(), RenderPassError>; + fn execute_bundles( + &mut self, + context: &global::Global, + bundles: &[id::RenderBundleId], + ) -> Result<(), RenderPassError>; + fn end(&mut self, context: &global::Global) -> Result<(), RenderPassError>; + + fn label(&self) -> Option<&str>; +} + +impl DynRenderPass for RenderPass { + fn set_index_buffer( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + index_format: wgt::IndexFormat, + offset: wgt::BufferAddress, + size: Option, + ) -> Result<(), RenderPassError> { + context.render_pass_set_index_buffer(self, buffer_id, index_format, offset, size) + } + + fn set_vertex_buffer( + &mut self, + context: &global::Global, + slot: u32, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + size: Option, + ) -> Result<(), RenderPassError> { + context.render_pass_set_vertex_buffer(self, slot, buffer_id, offset, size) + } + + fn set_bind_group( + &mut self, + context: &global::Global, + index: u32, + bind_group_id: id::BindGroupId, + offsets: &[wgt::DynamicOffset], + ) -> Result<(), RenderPassError> { + context.render_pass_set_bind_group(self, index, bind_group_id, offsets) + } + + fn set_pipeline( + &mut self, + context: &global::Global, + pipeline_id: id::RenderPipelineId, + ) -> Result<(), RenderPassError> { + context.render_pass_set_pipeline(self, pipeline_id) + } + + fn set_push_constants( + &mut self, + context: &global::Global, + stages: wgt::ShaderStages, + offset: u32, + data: &[u8], + ) -> Result<(), RenderPassError> { + context.render_pass_set_push_constants(self, stages, offset, data) + } + + fn draw( + &mut self, + context: &global::Global, + vertex_count: u32, + instance_count: u32, + first_vertex: u32, + first_instance: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_draw( + self, + vertex_count, + instance_count, + first_vertex, + first_instance, + ) + } + + fn draw_indexed( + &mut self, + context: &global::Global, + index_count: u32, + instance_count: u32, + first_index: u32, + base_vertex: i32, + first_instance: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_draw_indexed( + self, + index_count, + instance_count, + first_index, + base_vertex, + first_instance, + ) + } + + fn draw_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + ) -> Result<(), RenderPassError> { + context.render_pass_draw_indirect(self, buffer_id, offset) + } + + fn draw_indexed_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + ) -> Result<(), RenderPassError> { + context.render_pass_draw_indexed_indirect(self, buffer_id, offset) + } + + fn multi_draw_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_multi_draw_indirect(self, buffer_id, offset, count) + } + + fn multi_draw_indexed_indirect( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_multi_draw_indexed_indirect(self, buffer_id, offset, count) + } + + fn multi_draw_indirect_count( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count_buffer_id: id::BufferId, + count_buffer_offset: wgt::BufferAddress, + max_count: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_multi_draw_indirect_count( + self, + buffer_id, + offset, + count_buffer_id, + count_buffer_offset, + max_count, + ) + } + + fn multi_draw_indexed_indirect_count( + &mut self, + context: &global::Global, + buffer_id: id::BufferId, + offset: wgt::BufferAddress, + count_buffer_id: id::BufferId, + count_buffer_offset: wgt::BufferAddress, + max_count: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_multi_draw_indexed_indirect_count( + self, + buffer_id, + offset, + count_buffer_id, + count_buffer_offset, + max_count, + ) + } + + fn set_blend_constant( + &mut self, + context: &global::Global, + color: wgt::Color, + ) -> Result<(), RenderPassError> { + context.render_pass_set_blend_constant(self, color) + } + + fn set_scissor_rect( + &mut self, + context: &global::Global, + x: u32, + y: u32, + width: u32, + height: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_set_scissor_rect(self, x, y, width, height) + } + + fn set_viewport( + &mut self, + context: &global::Global, + x: f32, + y: f32, + width: f32, + height: f32, + min_depth: f32, + max_depth: f32, + ) -> Result<(), RenderPassError> { + context.render_pass_set_viewport(self, x, y, width, height, min_depth, max_depth) + } + + fn set_stencil_reference( + &mut self, + context: &global::Global, + reference: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_set_stencil_reference(self, reference) + } + + fn push_debug_group( + &mut self, + context: &global::Global, + label: &str, + color: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_push_debug_group(self, label, color) + } + + fn pop_debug_group(&mut self, context: &global::Global) -> Result<(), RenderPassError> { + context.render_pass_pop_debug_group(self) + } + + fn insert_debug_marker( + &mut self, + context: &global::Global, + label: &str, + color: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_insert_debug_marker(self, label, color) + } + + fn write_timestamp( + &mut self, + context: &global::Global, + query_set_id: id::QuerySetId, + query_index: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_write_timestamp(self, query_set_id, query_index) + } + + fn begin_occlusion_query( + &mut self, + context: &global::Global, + query_index: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_begin_occlusion_query(self, query_index) + } + + fn end_occlusion_query(&mut self, context: &global::Global) -> Result<(), RenderPassError> { + context.render_pass_end_occlusion_query(self) + } + + fn begin_pipeline_statistics_query( + &mut self, + context: &global::Global, + query_set_id: id::QuerySetId, + query_index: u32, + ) -> Result<(), RenderPassError> { + context.render_pass_begin_pipeline_statistics_query(self, query_set_id, query_index) + } + + fn end_pipeline_statistics_query( + &mut self, + context: &global::Global, + ) -> Result<(), RenderPassError> { + context.render_pass_end_pipeline_statistics_query(self) + } + + fn execute_bundles( + &mut self, + context: &global::Global, + bundles: &[id::RenderBundleId], + ) -> Result<(), RenderPassError> { + context.render_pass_execute_bundles(self, bundles) + } + + fn end(&mut self, context: &global::Global) -> Result<(), RenderPassError> { + context.render_pass_end(self) + } + + fn label(&self) -> Option<&str> { + self.label() + } +} diff --git a/wgpu-core/src/command/mod.rs b/wgpu-core/src/command/mod.rs index 26a7fcd302..e1f1a5ceef 100644 --- a/wgpu-core/src/command/mod.rs +++ b/wgpu-core/src/command/mod.rs @@ -6,6 +6,7 @@ mod compute; mod compute_command; mod draw; mod dyn_compute_pass; +mod dyn_render_pass; mod memory_init; mod query; mod render; @@ -18,8 +19,8 @@ use std::sync::Arc; pub(crate) use self::clear::clear_texture; pub use self::{ bundle::*, clear::ClearError, compute::*, compute_command::ComputeCommand, draw::*, - dyn_compute_pass::DynComputePass, query::*, render::*, render_command::RenderCommand, - transfer::*, + dyn_compute_pass::DynComputePass, dyn_render_pass::DynRenderPass, query::*, render::*, + render_command::RenderCommand, transfer::*, }; pub(crate) use allocator::CommandAllocator; @@ -608,8 +609,28 @@ pub enum CommandEncoderError { Device(#[from] DeviceError), #[error("Command encoder is locked by a previously created render/compute pass. Before recording any new commands, the pass must be ended.")] Locked, - #[error("QuerySet provided for pass timestamp writes is invalid.")] - InvalidTimestampWritesQuerySetId, + + #[error("QuerySet {0:?} for pass timestamp writes is invalid.")] + InvalidTimestampWritesQuerySetId(id::QuerySetId), + #[error("Attachment texture view {0:?} is invalid")] + InvalidAttachment(id::TextureViewId), + #[error("Attachment texture view {0:?} for resolve is invalid")] + InvalidResolveTarget(id::TextureViewId), + #[error("Depth stencil attachment view {0:?} is invalid")] + InvalidDepthStencilAttachment(id::TextureViewId), + #[error("Occlusion query set {0:?} is invalid")] + InvalidOcclusionQuerySetId(id::QuerySetId), +} + +impl PrettyError for CommandEncoderError { + fn fmt_pretty(&self, fmt: &mut ErrorFormatter) { + fmt.error(self); + if let Self::InvalidAttachment(id) = *self { + fmt.texture_view_label_with_key(&id, "attachment"); + } else if let Self::InvalidResolveTarget(id) = *self { + fmt.texture_view_label_with_key(&id, "resolve target"); + }; + } } impl Global { @@ -864,10 +885,7 @@ pub enum PassErrorScope { #[error("In a bundle parameter")] Bundle, #[error("In a pass parameter")] - // TODO: To be removed in favor of `Pass`. - // ComputePass is already operating on command buffer instead, - // same should apply to RenderPass in the future. - PassEncoder(id::CommandEncoderId), + PassEncoder(id::CommandEncoderId), // Needed only for ending pass via tracing. #[error("In a pass parameter")] Pass(Option), #[error("In a set_bind_group command")] diff --git a/wgpu-core/src/command/render.rs b/wgpu-core/src/command/render.rs index 39e61b10e1..6565b05264 100644 --- a/wgpu-core/src/command/render.rs +++ b/wgpu-core/src/command/render.rs @@ -13,9 +13,9 @@ use crate::{ bind::Binder, end_occlusion_query, end_pipeline_statistics_query, memory_init::{fixup_discarded_surfaces, SurfacesInDiscardState}, - BasePass, BindGroupStateChange, CommandBuffer, CommandEncoderError, CommandEncoderStatus, - DrawError, ExecutionError, MapPassErr, PassErrorScope, QueryUseError, RenderCommandError, - StateChange, + ArcPassTimestampWrites, BasePass, BindGroupStateChange, CommandBuffer, CommandEncoderError, + CommandEncoderStatus, DrawError, ExecutionError, MapPassErr, PassErrorScope, + PassTimestampWrites, QueryUseError, RenderCommandError, StateChange, }, device::{ AttachmentData, Device, DeviceError, MissingDownlevelFlags, MissingFeatures, @@ -31,7 +31,6 @@ use crate::{ DestroyedResourceError, MissingBufferUsageError, MissingTextureUsageError, ParentDevice, QuerySet, Texture, TextureView, TextureViewNotRenderableReason, }, - storage::Storage, track::{ResourceUsageCompatibilityError, TextureSelector, Tracker, UsageScope}, Label, }; @@ -50,14 +49,14 @@ use serde::Deserialize; use serde::Serialize; use std::sync::Arc; -use std::{borrow::Cow, fmt, iter, marker::PhantomData, mem, num::NonZeroU32, ops::Range, str}; +use std::{borrow::Cow, fmt, iter, mem, num::NonZeroU32, ops::Range, str}; use super::render_command::{ArcRenderCommand, RenderCommand}; use super::{ memory_init::TextureSurfaceDiscard, CommandBufferTextureMemoryActions, CommandEncoder, QueryResetMap, }; -use super::{DrawKind, PassTimestampWrites, Rect}; +use super::{DrawKind, DynRenderPass, Rect}; /// Operation to perform to the output attachment at the start of a renderpass. #[repr(C)] @@ -135,6 +134,17 @@ pub struct RenderPassColorAttachment { pub channel: PassChannel, } +/// Describes a color attachment to a render pass. +#[derive(Debug)] +struct ArcRenderPassColorAttachment { + /// The view to use as an attachment. + pub view: Arc>, + /// The view that will receive the resolved output if multisampling is used. + pub resolve_target: Option>>, + /// What operations will be performed on this color attachment. + pub channel: PassChannel, +} + /// Describes a depth/stencil attachment to a render pass. #[repr(C)] #[derive(Clone, Debug, PartialEq)] @@ -147,8 +157,18 @@ pub struct RenderPassDepthStencilAttachment { /// What operations will be performed on the stencil part of the attachment. pub stencil: PassChannel, } +/// Describes a depth/stencil attachment to a render pass. +#[derive(Debug)] +pub struct ArcRenderPassDepthStencilAttachment { + /// The view to use as an attachment. + pub view: Arc>, + /// What operations will be performed on the depth part of the attachment. + pub depth: PassChannel, + /// What operations will be performed on the stencil part of the attachment. + pub stencil: PassChannel, +} -impl RenderPassDepthStencilAttachment { +impl ArcRenderPassDepthStencilAttachment { /// Validate the given aspects' read-only flags against their load /// and store ops. /// @@ -200,37 +220,61 @@ pub struct RenderPassDescriptor<'a> { pub occlusion_query_set: Option, } -#[cfg_attr(feature = "serde", derive(Deserialize, Serialize))] -pub struct RenderPass { +/// Describes the attachments of a render pass. +struct ArcRenderPassDescriptor<'a, A: HalApi> { + pub label: &'a Label<'a>, + /// The color attachments of the render pass. + pub color_attachments: + ArrayVec>, { hal::MAX_COLOR_ATTACHMENTS }>, + /// The depth and stencil attachment of the render pass, if any. + pub depth_stencil_attachment: Option>, + /// Defines where and when timestamp values will be written for this pass. + pub timestamp_writes: Option>, + /// Defines where the occlusion query results will be stored for this pass. + pub occlusion_query_set: Option>>, +} + +pub struct RenderPass { /// All pass data & records is stored here. /// /// If this is `None`, the pass is in the 'ended' state and can no longer be used. /// Any attempt to record more commands will result in a validation error. - // TODO: this is soon to become `ArcRenderCommand` - base: Option>, + base: Option>>, + + /// Parent command buffer that this pass records commands into. + /// + /// If it is none, this pass is invalid and any operation on it will return an error. + parent: Option>>, - parent_id: id::CommandEncoderId, - color_targets: ArrayVec, { hal::MAX_COLOR_ATTACHMENTS }>, - depth_stencil_target: Option, - timestamp_writes: Option, - occlusion_query_set_id: Option, + color_attachments: + ArrayVec>, { hal::MAX_COLOR_ATTACHMENTS }>, + depth_stencil_attachment: Option>, + timestamp_writes: Option>, + occlusion_query_set: Option>>, // Resource binding dedupe state. - #[cfg_attr(feature = "serde", serde(skip))] current_bind_groups: BindGroupStateChange, - #[cfg_attr(feature = "serde", serde(skip))] current_pipeline: StateChange, } -impl RenderPass { - pub fn new(parent_id: id::CommandEncoderId, desc: &RenderPassDescriptor) -> Self { +impl RenderPass { + /// If the parent command buffer is invalid, the returned pass will be invalid. + fn new(parent: Option>>, desc: ArcRenderPassDescriptor) -> Self { + let ArcRenderPassDescriptor { + label, + timestamp_writes, + color_attachments, + depth_stencil_attachment, + occlusion_query_set, + } = desc; + Self { - base: Some(BasePass::new(&desc.label)), - parent_id, - color_targets: desc.color_attachments.iter().cloned().collect(), - depth_stencil_target: desc.depth_stencil_attachment.cloned(), - timestamp_writes: desc.timestamp_writes.cloned(), - occlusion_query_set_id: desc.occlusion_query_set, + base: Some(BasePass::new(label)), + parent, + color_attachments, + depth_stencil_attachment, + timestamp_writes, + occlusion_query_set, current_bind_groups: BindGroupStateChange::new(), current_pipeline: StateChange::new(), @@ -238,8 +282,8 @@ impl RenderPass { } #[inline] - pub fn parent_id(&self) -> id::CommandEncoderId { - self.parent_id + pub fn parent_id(&self) -> Option { + self.parent.as_ref().map(|cmd_buf| cmd_buf.as_info().id()) } #[inline] @@ -250,7 +294,7 @@ impl RenderPass { fn base_mut<'a>( &'a mut self, scope: PassErrorScope, - ) -> Result<&'a mut BasePass, RenderPassError> { + ) -> Result<&'a mut BasePass>, RenderPassError> { self.base .as_mut() .ok_or(RenderPassErrorInner::PassEnded) @@ -258,12 +302,12 @@ impl RenderPass { } } -impl fmt::Debug for RenderPass { +impl fmt::Debug for RenderPass { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { f.debug_struct("RenderPass") - .field("encoder_id", &self.parent_id) - .field("color_targets", &self.color_targets) - .field("depth_stencil_target", &self.depth_stencil_target) + .field("encoder_id", &self.parent_id()) + .field("color_attachments", &self.color_attachments) + .field("depth_stencil_target", &self.depth_stencil_attachment) .field( "command count", &self.base.as_ref().map_or(0, |base| base.commands.len()), @@ -408,7 +452,7 @@ impl VertexState { } } -struct State<'attachment, 'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> { +struct State<'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> { pipeline_flags: PipelineFlags, binder: Binder, blend_constant: OptionalState, @@ -418,7 +462,7 @@ struct State<'attachment, 'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalA vertex: VertexState, debug_scope_depth: u32, - info: RenderPassInfo<'attachment, 'scope, A>, + info: RenderPassInfo<'scope, A>, snatch_guard: &'snatch_guard SnatchGuard<'snatch_guard>, @@ -436,8 +480,8 @@ struct State<'attachment, 'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalA active_query: Option<(Arc>, u32)>, } -impl<'attachment, 'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> - State<'attachment, 'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A> +impl<'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> + State<'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A> { fn is_ready(&self, indexed: bool) -> Result<(), DrawError> { if let Some(pipeline) = self.pipeline.as_ref() { @@ -548,10 +592,22 @@ pub enum RenderPassErrorInner { ColorAttachment(#[from] ColorAttachmentError), #[error(transparent)] Encoder(#[from] CommandEncoderError), - #[error("Attachment texture view Id {0:?} is invalid")] + #[error("Parent encoder is invalid")] + InvalidParentEncoder, + #[error("Attachment texture view {0:?} is invalid")] InvalidAttachmentId(id::TextureViewId), + #[error("Attachment texture view {0:?} is invalid")] + InvalidResolveTargetId(id::TextureViewId), #[error("The format of the depth-stencil attachment ({0:?}) is not a depth-stencil format")] InvalidDepthStencilAttachmentFormat(wgt::TextureFormat), + #[error("Buffer {0:?} is invalid or destroyed")] + InvalidBuffer(id::BufferId), + #[error("Render pipeline {0:?} is invalid")] + InvalidPipeline(id::RenderPipelineId), + #[error("QuerySet {0:?} is invalid")] + InvalidQuerySet(id::QuerySetId), + #[error("Render bundle {0:?} is invalid")] + InvalidRenderBundle(id::RenderBundleId), #[error("The format of the {location} ({format:?}) is not resolvable")] UnsupportedResolveTargetFormat { location: AttachmentErrorLocation, @@ -661,8 +717,6 @@ pub enum RenderPassErrorInner { "Multiview pass texture views with more than one array layer must have D2Array dimension" )] MultiViewDimensionMismatch, - #[error("QuerySet {0:?} is invalid")] - InvalidQuerySet(id::QuerySetId), #[error("missing occlusion query set")] MissingOcclusionQuerySet, #[error(transparent)] @@ -732,9 +786,9 @@ where } } -struct RenderAttachment<'a, A: HalApi> { +struct RenderAttachment { texture: Arc>, - selector: &'a TextureSelector, + selector: TextureSelector, usage: hal::TextureUses, } @@ -742,7 +796,7 @@ impl TextureView { fn to_render_attachment(&self, usage: hal::TextureUses) -> RenderAttachment { RenderAttachment { texture: self.parent.clone(), - selector: &self.selector, + selector: self.selector.clone(), usage, } } @@ -751,22 +805,21 @@ impl TextureView { const MAX_TOTAL_ATTACHMENTS: usize = hal::MAX_COLOR_ATTACHMENTS + hal::MAX_COLOR_ATTACHMENTS + 1; type AttachmentDataVec = ArrayVec; -struct RenderPassInfo<'a, 'd, A: HalApi> { +struct RenderPassInfo<'d, A: HalApi> { context: RenderPassContext, usage_scope: UsageScope<'d, A>, /// All render attachments, including depth/stencil - render_attachments: AttachmentDataVec>, + render_attachments: AttachmentDataVec>, is_depth_read_only: bool, is_stencil_read_only: bool, extent: wgt::Extent3d, - _phantom: PhantomData, pending_discard_init_fixups: SurfacesInDiscardState, - divergent_discarded_depth_stencil_aspect: Option<(wgt::TextureAspect, &'a TextureView)>, + divergent_discarded_depth_stencil_aspect: Option<(wgt::TextureAspect, Arc>)>, multiview: Option, } -impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { +impl<'d, A: HalApi> RenderPassInfo<'d, A> { fn add_pass_texture_init_actions( channel: &PassChannel, texture_memory_actions: &mut CommandBufferTextureMemoryActions, @@ -804,17 +857,18 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { fn start( device: &'d Device, hal_label: Option<&str>, - color_attachments: &[Option], - depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, - timestamp_writes: Option<&PassTimestampWrites>, - occlusion_query_set: Option>>, + color_attachments: ArrayVec< + Option>, + { hal::MAX_COLOR_ATTACHMENTS }, + >, + mut depth_stencil_attachment: Option>, + mut timestamp_writes: Option>, + mut occlusion_query_set: Option>>, encoder: &mut CommandEncoder, trackers: &mut Tracker, texture_memory_actions: &mut CommandBufferTextureMemoryActions, pending_query_resets: &mut QueryResetMap, - view_guard: &'a Storage>, - query_set_guard: &'a Storage>, - snatch_guard: &SnatchGuard<'a>, + snatch_guard: &SnatchGuard<'_>, ) -> Result { profiling::scope!("RenderPassInfo::start"); @@ -899,19 +953,10 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { Ok(()) }; - let mut colors = - ArrayVec::>, { hal::MAX_COLOR_ATTACHMENTS }>::new(); let mut depth_stencil = None; - if let Some(at) = depth_stencil_attachment { - let view = view_guard - .get(at.view) - .map_err(|_| RenderPassErrorInner::InvalidAttachmentId(at.view))?; - - trackers.views.add_single(view); - - let view = view.as_ref(); - + if let Some(at) = depth_stencil_attachment.as_ref() { + let view = &at.view; check_multiview(view)?; add_view(view, AttachmentErrorLocation::Depth)?; @@ -994,7 +1039,7 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { } else { wgt::TextureAspect::StencilOnly }, - view, + view.clone(), )); } else if at.depth.store_op == StoreOp::Discard { // Both are discarded using the regular path. @@ -1032,20 +1077,16 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { }); } + let mut color_attachments_hal = + ArrayVec::>, { hal::MAX_COLOR_ATTACHMENTS }>::new(); for (index, attachment) in color_attachments.iter().enumerate() { let at = if let Some(attachment) = attachment.as_ref() { attachment } else { - colors.push(None); + color_attachments_hal.push(None); continue; }; - - let color_view = view_guard - .get(at.view) - .map_err(|_| RenderPassErrorInner::InvalidAttachmentId(at.view))?; - - trackers.views.add_single(color_view); - + let color_view: &TextureView = &at.view; check_multiview(color_view)?; add_view( color_view, @@ -1075,13 +1116,7 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { .push(color_view.to_render_attachment(hal::TextureUses::COLOR_TARGET)); let mut hal_resolve_target = None; - if let Some(resolve_target) = at.resolve_target { - let resolve_view = view_guard - .get(resolve_target) - .map_err(|_| RenderPassErrorInner::InvalidAttachmentId(resolve_target))?; - - trackers.views.add_single(resolve_view); - + if let Some(resolve_view) = &at.resolve_target { check_multiview(resolve_view)?; let resolve_location = AttachmentErrorLocation::Color { @@ -1141,7 +1176,7 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { }); } - colors.push(Some(hal::ColorAttachment { + color_attachments_hal.push(Some(hal::ColorAttachment { target: hal::Attachment { view: color_view.try_raw(snatch_guard)?, usage: hal::TextureUses::COLOR_TARGET, @@ -1155,36 +1190,34 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { let extent = extent.ok_or(RenderPassErrorInner::MissingAttachments)?; let multiview = detected_multiview.expect("Multiview was not detected, no attachments"); - let view_data = AttachmentData { + let attachment_formats = AttachmentData { colors: color_attachments .iter() - .map(|at| at.as_ref().map(|at| view_guard.get(at.view).unwrap())) + .map(|at| at.as_ref().map(|at| at.view.desc.texture_format)) .collect(), resolves: color_attachments .iter() - .filter_map(|at| match *at { - Some(RenderPassColorAttachment { - resolve_target: Some(resolve), - .. - }) => Some(view_guard.get(resolve).unwrap()), - _ => None, + .filter_map(|at| { + at.as_ref().and_then(|at| { + at.resolve_target + .as_ref() + .map(|resolve| resolve.desc.format) + }) }) .collect(), - depth_stencil: depth_stencil_attachment.map(|at| view_guard.get(at.view).unwrap()), + depth_stencil: depth_stencil_attachment + .as_ref() + .map(|at| at.view.desc.format), }; let context = RenderPassContext { - attachments: view_data.map(|view| view.desc.format), + attachments: attachment_formats, sample_count, multiview, }; - let timestamp_writes = if let Some(tw) = timestamp_writes { - let query_set = query_set_guard - .get(tw.query_set) - .map_err(|_| RenderPassErrorInner::InvalidQuerySet(tw.query_set))?; - - trackers.query_sets.add_single(query_set); + let timestamp_writes_hal = timestamp_writes.as_ref().map(|tw| { + let query_set = &tw.query_set; if let Some(index) = tw.beginning_of_pass_write_index { pending_query_resets.use_query_set(query_set, index); @@ -1193,35 +1226,48 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { pending_query_resets.use_query_set(query_set, index); } - Some(hal::RenderPassTimestampWrites { + hal::RenderPassTimestampWrites { query_set: query_set.raw.as_ref().unwrap(), beginning_of_pass_write_index: tw.beginning_of_pass_write_index, end_of_pass_write_index: tw.end_of_pass_write_index, - }) - } else { - None - }; + } + }); - let occlusion_query_set = if let Some(query_set) = occlusion_query_set { - let query_set = trackers.query_sets.insert_single(query_set); - Some(query_set.raw.as_ref().unwrap()) - } else { - None - }; + let occlusion_query_set_hal = occlusion_query_set + .as_ref() + .map(|query_set| query_set.raw.as_ref().unwrap()); let hal_desc = hal::RenderPassDescriptor { label: hal_label, extent, sample_count, - color_attachments: &colors, + color_attachments: &color_attachments_hal, depth_stencil_attachment: depth_stencil, multiview, - timestamp_writes, - occlusion_query_set, + timestamp_writes: timestamp_writes_hal, + occlusion_query_set: occlusion_query_set_hal, }; unsafe { encoder.raw.begin_render_pass(&hal_desc); }; + drop(color_attachments_hal); // Drop, so we can consume `color_attachments` for the tracker. + + // Can't borrow the tracker more than once, so have to add to the tracker after the `begin_render_pass` hal call. + if let Some(tw) = timestamp_writes.take() { + trackers.query_sets.insert_single(tw.query_set); + }; + if let Some(occlusion_query_set) = occlusion_query_set.take() { + trackers.query_sets.insert_single(occlusion_query_set); + }; + if let Some(at) = depth_stencil_attachment.take() { + trackers.views.insert_single(at.view.clone()); + } + for at in color_attachments.into_iter().flatten() { + trackers.views.insert_single(at.view.clone()); + if let Some(resolve_target) = at.resolve_target { + trackers.views.insert_single(resolve_target); + } + } Ok(Self { context, @@ -1230,7 +1276,6 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { is_depth_read_only, is_stencil_read_only, extent, - _phantom: PhantomData, pending_discard_init_fixups, divergent_discarded_depth_stencil_aspect, multiview, @@ -1311,22 +1356,141 @@ impl<'a, 'd, A: HalApi> RenderPassInfo<'a, 'd, A> { } impl Global { - pub fn render_pass_end(&self, pass: &mut RenderPass) -> Result<(), RenderPassError> { - let scope = PassErrorScope::PassEncoder(pass.parent_id); - let base = pass - .base - .take() - .ok_or(RenderPassErrorInner::PassEnded) - .map_pass_err(scope)?; + /// Creates a render pass. + /// + /// If creation fails, an invalid pass is returned. + /// Any operation on an invalid pass will return an error. + /// + /// If successful, puts the encoder into the [`CommandEncoderStatus::Locked`] state. + pub fn command_encoder_create_render_pass( + &self, + encoder_id: id::CommandEncoderId, + desc: &RenderPassDescriptor<'_>, + ) -> (RenderPass, Option) { + fn fill_arc_desc( + hub: &crate::hub::Hub, + device: &Arc>, + desc: &RenderPassDescriptor<'_>, + arc_desc: &mut ArcRenderPassDescriptor, + ) -> Result<(), CommandEncoderError> { + let query_sets = hub.query_sets.read(); + let texture_views = hub.texture_views.read(); + + for color_attachment in desc.color_attachments.iter() { + if let Some(RenderPassColorAttachment { + view: view_id, + resolve_target, + channel, + }) = color_attachment + { + let view = texture_views + .get_owned(*view_id) + .map_err(|_| CommandEncoderError::InvalidAttachment(*view_id))?; + view.same_device(device)?; + + let resolve_target = if let Some(resolve_target_id) = resolve_target { + let rt_arc = texture_views.get_owned(*resolve_target_id).map_err(|_| { + CommandEncoderError::InvalidResolveTarget(*resolve_target_id) + })?; + rt_arc.same_device(device)?; + + Some(rt_arc) + } else { + None + }; + + arc_desc + .color_attachments + .push(Some(ArcRenderPassColorAttachment { + view, + resolve_target, + channel: channel.clone(), + })); + } else { + arc_desc.color_attachments.push(None); + } + } + + arc_desc.depth_stencil_attachment = + if let Some(depth_stencil_attachment) = desc.depth_stencil_attachment { + let view = texture_views + .get_owned(depth_stencil_attachment.view) + .map_err(|_| { + CommandEncoderError::InvalidDepthStencilAttachment( + depth_stencil_attachment.view, + ) + })?; + view.same_device(device)?; + + Some(ArcRenderPassDepthStencilAttachment { + view, + depth: depth_stencil_attachment.depth.clone(), + stencil: depth_stencil_attachment.stencil.clone(), + }) + } else { + None + }; + + arc_desc.timestamp_writes = if let Some(tw) = desc.timestamp_writes { + let query_set = query_sets.get_owned(tw.query_set).map_err(|_| { + CommandEncoderError::InvalidTimestampWritesQuerySetId(tw.query_set) + })?; + query_set.same_device(device)?; + + Some(ArcPassTimestampWrites { + query_set, + beginning_of_pass_write_index: tw.beginning_of_pass_write_index, + end_of_pass_write_index: tw.end_of_pass_write_index, + }) + } else { + None + }; + + arc_desc.occlusion_query_set = + if let Some(occlusion_query_set) = desc.occlusion_query_set { + let query_set = query_sets.get_owned(occlusion_query_set).map_err(|_| { + CommandEncoderError::InvalidOcclusionQuerySetId(occlusion_query_set) + })?; + query_set.same_device(device)?; + + Some(query_set) + } else { + None + }; + + Ok(()) + } + + let hub = A::hub(self); + let mut arc_desc = ArcRenderPassDescriptor { + label: &desc.label, + timestamp_writes: None, + color_attachments: ArrayVec::new(), + depth_stencil_attachment: None, + occlusion_query_set: None, + }; + + let cmd_buf = match CommandBuffer::lock_encoder(hub, encoder_id) { + Ok(cmd_buf) => cmd_buf, + Err(e) => return (RenderPass::new(None, arc_desc), Some(e)), + }; - self.render_pass_end_with_unresolved_commands::( - pass.parent_id, - base, - &pass.color_targets, - pass.depth_stencil_target.as_ref(), - pass.timestamp_writes.as_ref(), - pass.occlusion_query_set_id, - ) + let err = fill_arc_desc(hub, &cmd_buf.device, desc, &mut arc_desc).err(); + + (RenderPass::new(Some(cmd_buf), arc_desc), err) + } + + /// Creates a type erased render pass. + /// + /// If creation fails, an invalid pass is returned. + /// Any operation on an invalid pass will return an error. + pub fn command_encoder_create_render_pass_dyn( + &self, + encoder_id: id::CommandEncoderId, + desc: &RenderPassDescriptor<'_>, + ) -> (Box, Option) { + let (pass, err) = self.command_encoder_create_render_pass::(encoder_id, desc); + (Box::new(pass), err) } #[doc(hidden)] @@ -1337,62 +1501,78 @@ impl Global { color_attachments: &[Option], depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, timestamp_writes: Option<&PassTimestampWrites>, - occlusion_query_set_id: Option, + occlusion_query_set: Option, ) -> Result<(), RenderPassError> { - let pass_scope = PassErrorScope::PassEncoder(encoder_id); + let BasePass { + label, + commands, + dynamic_offsets, + string_data, + push_constant_data, + } = base; + + let (mut render_pass, encoder_error) = self.command_encoder_create_render_pass::( + encoder_id, + &RenderPassDescriptor { + label: label.as_deref().map(Cow::Borrowed), + color_attachments: Cow::Borrowed(color_attachments), + depth_stencil_attachment, + timestamp_writes, + occlusion_query_set, + }, + ); + if let Some(err) = encoder_error { + return Err(RenderPassError { + scope: PassErrorScope::PassEncoder(encoder_id), + inner: err.into(), + }); + }; let hub = A::hub(self); + render_pass.base = Some(BasePass { + label, + commands: RenderCommand::resolve_render_command_ids(hub, &commands)?, + dynamic_offsets, + string_data, + push_constant_data, + }); - let commands = RenderCommand::resolve_render_command_ids(hub, &base.commands)?; - - let occlusion_query_set = occlusion_query_set_id - .map(|id| { - hub.query_sets - .get(id) - .map_err(|_| RenderPassErrorInner::InvalidQuerySet(id)) + if let Some(err) = encoder_error { + Err(RenderPassError { + scope: PassErrorScope::PassEncoder(encoder_id), + inner: err.into(), }) - .transpose() - .map_pass_err(pass_scope)?; - - self.render_pass_end_impl::( - encoder_id, - BasePass { - label: base.label, - commands, - dynamic_offsets: base.dynamic_offsets, - string_data: base.string_data, - push_constant_data: base.push_constant_data, - }, - color_attachments, - depth_stencil_attachment, - timestamp_writes, - occlusion_query_set, - ) + } else { + self.render_pass_end(&mut render_pass) + } } #[doc(hidden)] - pub fn render_pass_end_impl( + pub fn render_pass_end( &self, - encoder_id: id::CommandEncoderId, - base: BasePass>, - color_attachments: &[Option], - depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, - timestamp_writes: Option<&PassTimestampWrites>, - occlusion_query_set: Option>>, + pass: &mut RenderPass, ) -> Result<(), RenderPassError> { + let pass_scope = PassErrorScope::Pass(pass.parent_id()); + + let base = pass + .base + .take() + .ok_or(RenderPassErrorInner::PassEnded) + .map_pass_err(pass_scope)?; + profiling::scope!( "CommandEncoder::run_render_pass {}", base.label.unwrap_or("") ); - let hal_label = hal_label(base.label.as_deref(), self.instance.flags); - - let pass_scope = PassErrorScope::PassEncoder(encoder_id); + let Some(cmd_buf) = pass.parent.as_ref() else { + return Err(RenderPassErrorInner::InvalidParentEncoder).map_pass_err(pass_scope); + }; + cmd_buf.unlock_encoder().map_pass_err(pass_scope)?; + let cmd_buf_id = cmd_buf.as_info().id(); - let hub = A::hub(self); + let hal_label = hal_label(base.label.as_deref(), self.instance.flags); - let cmd_buf: Arc> = - CommandBuffer::get_encoder(hub, encoder_id).map_pass_err(pass_scope)?; let device = &cmd_buf.device; let snatch_guard = &device.snatchable_lock.read(); @@ -1410,12 +1590,35 @@ impl Global { string_data: base.string_data.to_vec(), push_constant_data: base.push_constant_data.to_vec(), }, - target_colors: color_attachments.to_vec(), - target_depth_stencil: depth_stencil_attachment.cloned(), - timestamp_writes: timestamp_writes.cloned(), - occlusion_query_set_id: occlusion_query_set + target_colors: pass + .color_attachments + .iter() + .map(|attachment| { + attachment.as_ref().map(|a| RenderPassColorAttachment { + view: a.view.as_info().id(), + resolve_target: a.resolve_target.as_ref().map(|a| a.as_info().id()), + channel: a.channel.clone(), + }) + }) + .collect(), + target_depth_stencil: pass.depth_stencil_attachment.as_ref().map(|d| { + RenderPassDepthStencilAttachment { + view: d.view.as_info().id(), + depth: d.depth.clone(), + stencil: d.stencil.clone(), + } + }), + timestamp_writes: pass.timestamp_writes.as_ref().map(|tw| { + PassTimestampWrites { + query_set: tw.query_set.as_info().id(), + beginning_of_pass_write_index: tw.beginning_of_pass_write_index, + end_of_pass_write_index: tw.end_of_pass_write_index, + } + }), + occlusion_query_set_id: pass + .occlusion_query_set .as_ref() - .map(|query_set| query_set.as_info().id()), + .map(|q| q.as_info().id()), }); } @@ -1436,27 +1639,24 @@ impl Global { *status = CommandEncoderStatus::Error; encoder.open_pass(hal_label).map_pass_err(pass_scope)?; - let query_set_guard = hub.query_sets.read(); - let view_guard = hub.texture_views.read(); - log::trace!( "Encoding render pass begin in command buffer {:?}", - encoder_id + cmd_buf_id ); let info = RenderPassInfo::start( device, hal_label, - color_attachments, - depth_stencil_attachment, - timestamp_writes, - occlusion_query_set.clone(), + pass.color_attachments.take(), + pass.depth_stencil_attachment.take(), + pass.timestamp_writes.take(), + // Still needed down the line. + // TODO(wumpf): by restructuring the code, we could get rid of some of this Arc clone. + pass.occlusion_query_set.clone(), encoder, tracker, texture_memory_actions, pending_query_resets, - &*view_guard, - &*query_set_guard, snatch_guard, ) .map_pass_err(pass_scope)?; @@ -1510,7 +1710,7 @@ impl Global { let scope = PassErrorScope::SetBindGroup; set_bind_group( &mut state, - &cmd_buf, + cmd_buf, &base.dynamic_offsets, index, num_dynamic_offsets, @@ -1520,7 +1720,7 @@ impl Global { } ArcRenderCommand::SetPipeline(pipeline) => { let scope = PassErrorScope::SetPipelineRender; - set_pipeline(&mut state, &cmd_buf, pipeline).map_pass_err(scope)?; + set_pipeline(&mut state, cmd_buf, pipeline).map_pass_err(scope)?; } ArcRenderCommand::SetIndexBuffer { buffer, @@ -1529,7 +1729,7 @@ impl Global { size, } => { let scope = PassErrorScope::SetIndexBuffer; - set_index_buffer(&mut state, &cmd_buf, buffer, index_format, offset, size) + set_index_buffer(&mut state, cmd_buf, buffer, index_format, offset, size) .map_pass_err(scope)?; } ArcRenderCommand::SetVertexBuffer { @@ -1539,7 +1739,7 @@ impl Global { size, } => { let scope = PassErrorScope::SetVertexBuffer; - set_vertex_buffer(&mut state, &cmd_buf, slot, buffer, offset, size) + set_vertex_buffer(&mut state, cmd_buf, slot, buffer, offset, size) .map_pass_err(scope)?; } ArcRenderCommand::SetBlendConstant(ref color) => { @@ -1684,7 +1884,8 @@ impl Global { api_log!("RenderPass::begin_occlusion_query {query_index}"); let scope = PassErrorScope::BeginOcclusionQuery; - let query_set = occlusion_query_set + let query_set = pass + .occlusion_query_set .clone() .ok_or(RenderPassErrorInner::MissingOcclusionQuerySet) .map_pass_err(scope)?; @@ -1736,12 +1937,12 @@ impl Global { } ArcRenderCommand::ExecuteBundle(bundle) => { let scope = PassErrorScope::ExecuteBundle; - execute_bundle(&mut state, &cmd_buf, bundle).map_pass_err(scope)?; + execute_bundle(&mut state, cmd_buf, bundle).map_pass_err(scope)?; } } } - log::trace!("Merging renderpass into cmd_buf {:?}", encoder_id); + log::trace!("Merging renderpass into cmd_buf {:?}", cmd_buf_id); let (trackers, pending_discard_init_fixups) = state .info .finish(state.raw_encoder, state.snatch_guard) @@ -1751,10 +1952,6 @@ impl Global { (trackers, pending_discard_init_fixups) }; - let cmd_buf = hub - .command_buffers - .get(encoder_id.into_command_buffer_id()) - .unwrap(); let mut cmd_buf_data = cmd_buf.data.lock(); let cmd_buf_data = cmd_buf_data.as_mut().unwrap(); @@ -2607,9 +2804,41 @@ fn execute_bundle( } impl Global { - pub fn render_pass_set_bind_group( + fn resolve_render_pass_buffer_id( + &self, + scope: PassErrorScope, + buffer_id: id::Id, + ) -> Result>, RenderPassError> { + let hub = A::hub(self); + let buffer = hub + .buffers + .read() + .get_owned(buffer_id) + .map_err(|_| RenderPassErrorInner::InvalidBuffer(buffer_id)) + .map_pass_err(scope)?; + + Ok(buffer) + } + + fn resolve_render_pass_query_set( + &self, + scope: PassErrorScope, + query_set_id: id::Id, + ) -> Result>, RenderPassError> { + let hub = A::hub(self); + let query_set = hub + .query_sets + .read() + .get_owned(query_set_id) + .map_err(|_| RenderPassErrorInner::InvalidQuerySet(query_set_id)) + .map_pass_err(scope)?; + + Ok(query_set) + } + + pub fn render_pass_set_bind_group( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, index: u32, bind_group_id: id::BindGroupId, offsets: &[DynamicOffset], @@ -2631,18 +2860,26 @@ impl Global { return Ok(()); } - base.commands.push(RenderCommand::SetBindGroup { + let hub = A::hub(self); + let bind_group = hub + .bind_groups + .read() + .get_owned(bind_group_id) + .map_err(|_| RenderPassErrorInner::InvalidBindGroup(index)) + .map_pass_err(scope)?; + + base.commands.push(ArcRenderCommand::SetBindGroup { index, num_dynamic_offsets: offsets.len(), - bind_group_id, + bind_group, }); Ok(()) } - pub fn render_pass_set_pipeline( + pub fn render_pass_set_pipeline( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, pipeline_id: id::RenderPipelineId, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::SetPipelineRender; @@ -2655,14 +2892,22 @@ impl Global { return Ok(()); } - base.commands.push(RenderCommand::SetPipeline(pipeline_id)); + let hub = A::hub(self); + let pipeline = hub + .render_pipelines + .read() + .get_owned(pipeline_id) + .map_err(|_| RenderPassErrorInner::InvalidPipeline(pipeline_id)) + .map_pass_err(scope)?; + + base.commands.push(ArcRenderCommand::SetPipeline(pipeline)); Ok(()) } - pub fn render_pass_set_index_buffer( + pub fn render_pass_set_index_buffer( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, index_format: IndexFormat, offset: BufferAddress, @@ -2671,8 +2916,8 @@ impl Global { let scope = PassErrorScope::SetIndexBuffer; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::SetIndexBuffer { - buffer_id, + base.commands.push(ArcRenderCommand::SetIndexBuffer { + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, index_format, offset, size, @@ -2681,9 +2926,9 @@ impl Global { Ok(()) } - pub fn render_pass_set_vertex_buffer( + pub fn render_pass_set_vertex_buffer( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, slot: u32, buffer_id: id::BufferId, offset: BufferAddress, @@ -2692,9 +2937,9 @@ impl Global { let scope = PassErrorScope::SetVertexBuffer; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::SetVertexBuffer { + base.commands.push(ArcRenderCommand::SetVertexBuffer { slot, - buffer_id, + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, offset, size, }); @@ -2702,36 +2947,37 @@ impl Global { Ok(()) } - pub fn render_pass_set_blend_constant( + pub fn render_pass_set_blend_constant( &self, - pass: &mut RenderPass, - color: &Color, + pass: &mut RenderPass, + color: Color, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::SetBlendConstant; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::SetBlendConstant(*color)); + base.commands + .push(ArcRenderCommand::SetBlendConstant(color)); Ok(()) } - pub fn render_pass_set_stencil_reference( + pub fn render_pass_set_stencil_reference( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, value: u32, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::SetStencilReference; let base = pass.base_mut(scope)?; base.commands - .push(RenderCommand::SetStencilReference(value)); + .push(ArcRenderCommand::SetStencilReference(value)); Ok(()) } - pub fn render_pass_set_viewport( + pub fn render_pass_set_viewport( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, x: f32, y: f32, w: f32, @@ -2742,7 +2988,7 @@ impl Global { let scope = PassErrorScope::SetViewport; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::SetViewport { + base.commands.push(ArcRenderCommand::SetViewport { rect: Rect { x, y, w, h }, depth_min, depth_max, @@ -2751,9 +2997,9 @@ impl Global { Ok(()) } - pub fn render_pass_set_scissor_rect( + pub fn render_pass_set_scissor_rect( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, x: u32, y: u32, w: u32, @@ -2763,14 +3009,14 @@ impl Global { let base = pass.base_mut(scope)?; base.commands - .push(RenderCommand::SetScissor(Rect { x, y, w, h })); + .push(ArcRenderCommand::SetScissor(Rect { x, y, w, h })); Ok(()) } - pub fn render_pass_set_push_constants( + pub fn render_pass_set_push_constants( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, stages: ShaderStages, offset: u32, data: &[u8], @@ -2797,7 +3043,7 @@ impl Global { .map(|arr| u32::from_ne_bytes([arr[0], arr[1], arr[2], arr[3]])), ); - base.commands.push(RenderCommand::SetPushConstant { + base.commands.push(ArcRenderCommand::SetPushConstant { stages, offset, size_bytes: data.len() as u32, @@ -2807,9 +3053,9 @@ impl Global { Ok(()) } - pub fn render_pass_draw( + pub fn render_pass_draw( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, vertex_count: u32, instance_count: u32, first_vertex: u32, @@ -2821,7 +3067,7 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::Draw { + base.commands.push(ArcRenderCommand::Draw { vertex_count, instance_count, first_vertex, @@ -2831,9 +3077,9 @@ impl Global { Ok(()) } - pub fn render_pass_draw_indexed( + pub fn render_pass_draw_indexed( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, index_count: u32, instance_count: u32, first_index: u32, @@ -2846,7 +3092,7 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::DrawIndexed { + base.commands.push(ArcRenderCommand::DrawIndexed { index_count, instance_count, first_index, @@ -2857,9 +3103,9 @@ impl Global { Ok(()) } - pub fn render_pass_draw_indirect( + pub fn render_pass_draw_indirect( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, ) -> Result<(), RenderPassError> { @@ -2869,8 +3115,8 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirect { - buffer_id, + base.commands.push(ArcRenderCommand::MultiDrawIndirect { + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, offset, count: None, indexed: false, @@ -2879,9 +3125,9 @@ impl Global { Ok(()) } - pub fn render_pass_draw_indexed_indirect( + pub fn render_pass_draw_indexed_indirect( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, ) -> Result<(), RenderPassError> { @@ -2891,8 +3137,8 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirect { - buffer_id, + base.commands.push(ArcRenderCommand::MultiDrawIndirect { + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, offset, count: None, indexed: true, @@ -2901,9 +3147,9 @@ impl Global { Ok(()) } - pub fn render_pass_multi_draw_indirect( + pub fn render_pass_multi_draw_indirect( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, count: u32, @@ -2914,8 +3160,8 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirect { - buffer_id, + base.commands.push(ArcRenderCommand::MultiDrawIndirect { + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, offset, count: NonZeroU32::new(count), indexed: false, @@ -2924,9 +3170,9 @@ impl Global { Ok(()) } - pub fn render_pass_multi_draw_indexed_indirect( + pub fn render_pass_multi_draw_indexed_indirect( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, count: u32, @@ -2937,8 +3183,8 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirect { - buffer_id, + base.commands.push(ArcRenderCommand::MultiDrawIndirect { + buffer: self.resolve_render_pass_buffer_id(scope, buffer_id)?, offset, count: NonZeroU32::new(count), indexed: true, @@ -2947,9 +3193,9 @@ impl Global { Ok(()) } - pub fn render_pass_multi_draw_indirect_count( + pub fn render_pass_multi_draw_indirect_count( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, count_buffer_id: id::BufferId, @@ -2962,21 +3208,34 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirectCount { - buffer_id, - offset, - count_buffer_id, - count_buffer_offset, - max_count, - indexed: false, - }); + // Don't use resolve_render_pass_buffer_id here, because we don't want to take the read-lock twice. + let hub = A::hub(self); + let buffers = hub.buffers.read(); + let buffer = buffers + .get_owned(buffer_id) + .map_err(|_| RenderPassErrorInner::InvalidBuffer(buffer_id)) + .map_pass_err(scope)?; + let count_buffer = buffers + .get_owned(buffer_id) + .map_err(|_| RenderPassErrorInner::InvalidBuffer(count_buffer_id)) + .map_pass_err(scope)?; + + base.commands + .push(ArcRenderCommand::MultiDrawIndirectCount { + buffer, + offset, + count_buffer, + count_buffer_offset, + max_count, + indexed: false, + }); Ok(()) } - pub fn render_pass_multi_draw_indexed_indirect_count( + pub fn render_pass_multi_draw_indexed_indirect_count( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, buffer_id: id::BufferId, offset: BufferAddress, count_buffer_id: id::BufferId, @@ -2989,21 +3248,35 @@ impl Global { }; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::MultiDrawIndirectCount { - buffer_id, - offset, - count_buffer_id, - count_buffer_offset, - max_count, - indexed: true, - }); + // Don't use resolve_render_pass_buffer_id here, because we don't want to take the read-lock twice. + let hub = A::hub(self); + let buffers = hub.buffers.read(); + let buffer = buffers + .get_owned(buffer_id) + .map_err(|_| RenderPassErrorInner::InvalidBuffer(buffer_id)) + .map_pass_err(scope)?; + + let count_buffer = buffers + .get_owned(buffer_id) + .map_err(|_| RenderPassErrorInner::InvalidBuffer(count_buffer_id)) + .map_pass_err(scope)?; + + base.commands + .push(ArcRenderCommand::MultiDrawIndirectCount { + buffer, + offset, + count_buffer, + count_buffer_offset, + max_count, + indexed: true, + }); Ok(()) } - pub fn render_pass_push_debug_group( + pub fn render_pass_push_debug_group( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, label: &str, color: u32, ) -> Result<(), RenderPassError> { @@ -3012,7 +3285,7 @@ impl Global { let bytes = label.as_bytes(); base.string_data.extend_from_slice(bytes); - base.commands.push(RenderCommand::PushDebugGroup { + base.commands.push(ArcRenderCommand::PushDebugGroup { color, len: bytes.len(), }); @@ -3020,20 +3293,20 @@ impl Global { Ok(()) } - pub fn render_pass_pop_debug_group( + pub fn render_pass_pop_debug_group( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, ) -> Result<(), RenderPassError> { let base = pass.base_mut(PassErrorScope::PopDebugGroup)?; - base.commands.push(RenderCommand::PopDebugGroup); + base.commands.push(ArcRenderCommand::PopDebugGroup); Ok(()) } - pub fn render_pass_insert_debug_marker( + pub fn render_pass_insert_debug_marker( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, label: &str, color: u32, ) -> Result<(), RenderPassError> { @@ -3042,7 +3315,7 @@ impl Global { let bytes = label.as_bytes(); base.string_data.extend_from_slice(bytes); - base.commands.push(RenderCommand::InsertDebugMarker { + base.commands.push(ArcRenderCommand::InsertDebugMarker { color, len: bytes.len(), }); @@ -3050,52 +3323,52 @@ impl Global { Ok(()) } - pub fn render_pass_write_timestamp( + pub fn render_pass_write_timestamp( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, query_set_id: id::QuerySetId, query_index: u32, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::WriteTimestamp; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::WriteTimestamp { - query_set_id, + base.commands.push(ArcRenderCommand::WriteTimestamp { + query_set: self.resolve_render_pass_query_set(scope, query_set_id)?, query_index, }); Ok(()) } - pub fn render_pass_begin_occlusion_query( + pub fn render_pass_begin_occlusion_query( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, query_index: u32, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::BeginOcclusionQuery; let base = pass.base_mut(scope)?; base.commands - .push(RenderCommand::BeginOcclusionQuery { query_index }); + .push(ArcRenderCommand::BeginOcclusionQuery { query_index }); Ok(()) } - pub fn render_pass_end_occlusion_query( + pub fn render_pass_end_occlusion_query( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::EndOcclusionQuery; let base = pass.base_mut(scope)?; - base.commands.push(RenderCommand::EndOcclusionQuery); + base.commands.push(ArcRenderCommand::EndOcclusionQuery); Ok(()) } - pub fn render_pass_begin_pipeline_statistics_query( + pub fn render_pass_begin_pipeline_statistics_query( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, query_set_id: id::QuerySetId, query_index: u32, ) -> Result<(), RenderPassError> { @@ -3103,37 +3376,45 @@ impl Global { let base = pass.base_mut(scope)?; base.commands - .push(RenderCommand::BeginPipelineStatisticsQuery { - query_set_id, + .push(ArcRenderCommand::BeginPipelineStatisticsQuery { + query_set: self.resolve_render_pass_query_set(scope, query_set_id)?, query_index, }); Ok(()) } - pub fn render_pass_end_pipeline_statistics_query( + pub fn render_pass_end_pipeline_statistics_query( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, ) -> Result<(), RenderPassError> { let scope = PassErrorScope::EndPipelineStatisticsQuery; let base = pass.base_mut(scope)?; base.commands - .push(RenderCommand::EndPipelineStatisticsQuery); + .push(ArcRenderCommand::EndPipelineStatisticsQuery); Ok(()) } - pub fn render_pass_execute_bundles( + pub fn render_pass_execute_bundles( &self, - pass: &mut RenderPass, + pass: &mut RenderPass, render_bundle_ids: &[id::RenderBundleId], ) -> Result<(), RenderPassError> { let scope = PassErrorScope::ExecuteBundle; let base = pass.base_mut(scope)?; + let hub = A::hub(self); + let bundles = hub.render_bundles.read(); + for &bundle_id in render_bundle_ids { - base.commands.push(RenderCommand::ExecuteBundle(bundle_id)); + let bundle = bundles + .get_owned(bundle_id) + .map_err(|_| RenderPassErrorInner::InvalidRenderBundle(bundle_id)) + .map_pass_err(scope)?; + + base.commands.push(ArcRenderCommand::ExecuteBundle(bundle)); } pass.current_pipeline.reset(); pass.current_bind_groups.reset(); diff --git a/wgpu-core/src/device/mod.rs b/wgpu-core/src/device/mod.rs index ab774d87c0..39b74ddcbb 100644 --- a/wgpu-core/src/device/mod.rs +++ b/wgpu-core/src/device/mod.rs @@ -60,15 +60,6 @@ pub(crate) struct AttachmentData { pub depth_stencil: Option, } impl Eq for AttachmentData {} -impl AttachmentData { - pub(crate) fn map U>(&self, fun: F) -> AttachmentData { - AttachmentData { - colors: self.colors.iter().map(|c| c.as_ref().map(&fun)).collect(), - resolves: self.resolves.iter().map(&fun).collect(), - depth_stencil: self.depth_stencil.as_ref().map(&fun), - } - } -} #[derive(Clone, Debug, Hash, PartialEq)] #[cfg_attr(feature = "serde", derive(serde::Deserialize, serde::Serialize))] diff --git a/wgpu/src/backend/wgpu_core.rs b/wgpu/src/backend/wgpu_core.rs index 3dbbd92d21..8f424863bc 100644 --- a/wgpu/src/backend/wgpu_core.rs +++ b/wgpu/src/backend/wgpu_core.rs @@ -490,7 +490,7 @@ pub struct ComputePass { #[derive(Debug)] pub struct RenderPass { - pass: wgc::command::RenderPass, + pass: Box, error_sink: ErrorSink, } @@ -1988,21 +1988,28 @@ impl crate::Context for ContextWgpuCore { end_of_pass_write_index: tw.end_of_pass_write_index, }); + let (pass, err) = gfx_select!(encoder => self.0.command_encoder_create_render_pass_dyn(*encoder, &wgc::command::RenderPassDescriptor { + label: desc.label.map(Borrowed), + timestamp_writes: timestamp_writes.as_ref(), + color_attachments: std::borrow::Cow::Borrowed(&colors), + depth_stencil_attachment: depth_stencil.as_ref(), + occlusion_query_set: desc.occlusion_query_set.map(|query_set| query_set.id.into()), + })); + + if let Some(cause) = err { + self.handle_error( + &encoder_data.error_sink, + cause, + LABEL, + desc.label, + "CommandEncoder::begin_compute_pass", + ); + } + ( Unused, - RenderPass { - pass: wgc::command::RenderPass::new( - *encoder, - &wgc::command::RenderPassDescriptor { - label: desc.label.map(Borrowed), - color_attachments: Borrowed(&colors), - depth_stencil_attachment: depth_stencil.as_ref(), - timestamp_writes: timestamp_writes.as_ref(), - occlusion_query_set: desc - .occlusion_query_set - .map(|query_set| query_set.id.into()), - }, - ), + Self::RenderPassData { + pass, error_sink: encoder_data.error_sink.clone(), }, ) @@ -2810,10 +2817,7 @@ impl crate::Context for ContextWgpuCore { pipeline: &Self::RenderPipelineId, _pipeline_data: &Self::RenderPipelineData, ) { - if let Err(cause) = self - .0 - .render_pass_set_pipeline(&mut pass_data.pass, *pipeline) - { + if let Err(cause) = pass_data.pass.set_pipeline(&self.0, *pipeline) { self.handle_error( &pass_data.error_sink, cause, @@ -2833,9 +2837,9 @@ impl crate::Context for ContextWgpuCore { _bind_group_data: &Self::BindGroupData, offsets: &[wgt::DynamicOffset], ) { - if let Err(cause) = - self.0 - .render_pass_set_bind_group(&mut pass_data.pass, index, *bind_group, offsets) + if let Err(cause) = pass_data + .pass + .set_bind_group(&self.0, index, *bind_group, offsets) { self.handle_error( &pass_data.error_sink, @@ -2857,13 +2861,11 @@ impl crate::Context for ContextWgpuCore { offset: wgt::BufferAddress, size: Option, ) { - if let Err(cause) = self.0.render_pass_set_index_buffer( - &mut pass_data.pass, - *buffer, - index_format, - offset, - size, - ) { + if let Err(cause) = + pass_data + .pass + .set_index_buffer(&self.0, *buffer, index_format, offset, size) + { self.handle_error( &pass_data.error_sink, cause, @@ -2884,9 +2886,9 @@ impl crate::Context for ContextWgpuCore { offset: wgt::BufferAddress, size: Option, ) { - if let Err(cause) = - self.0 - .render_pass_set_vertex_buffer(&mut pass_data.pass, slot, *buffer, offset, size) + if let Err(cause) = pass_data + .pass + .set_vertex_buffer(&self.0, slot, *buffer, offset, size) { self.handle_error( &pass_data.error_sink, @@ -2906,9 +2908,9 @@ impl crate::Context for ContextWgpuCore { offset: u32, data: &[u8], ) { - if let Err(cause) = - self.0 - .render_pass_set_push_constants(&mut pass_data.pass, stages, offset, data) + if let Err(cause) = pass_data + .pass + .set_push_constants(&self.0, stages, offset, data) { self.handle_error( &pass_data.error_sink, @@ -2927,8 +2929,8 @@ impl crate::Context for ContextWgpuCore { vertices: Range, instances: Range, ) { - if let Err(cause) = self.0.render_pass_draw( - &mut pass_data.pass, + if let Err(cause) = pass_data.pass.draw( + &self.0, vertices.end - vertices.start, instances.end - instances.start, vertices.start, @@ -2952,8 +2954,8 @@ impl crate::Context for ContextWgpuCore { base_vertex: i32, instances: Range, ) { - if let Err(cause) = self.0.render_pass_draw_indexed( - &mut pass_data.pass, + if let Err(cause) = pass_data.pass.draw_indexed( + &self.0, indices.end - indices.start, instances.end - instances.start, indices.start, @@ -2978,9 +2980,9 @@ impl crate::Context for ContextWgpuCore { _indirect_buffer_data: &Self::BufferData, indirect_offset: wgt::BufferAddress, ) { - if let Err(cause) = - self.0 - .render_pass_draw_indirect(&mut pass_data.pass, *indirect_buffer, indirect_offset) + if let Err(cause) = pass_data + .pass + .draw_indirect(&self.0, *indirect_buffer, indirect_offset) { self.handle_error( &pass_data.error_sink, @@ -3000,11 +3002,11 @@ impl crate::Context for ContextWgpuCore { _indirect_buffer_data: &Self::BufferData, indirect_offset: wgt::BufferAddress, ) { - if let Err(cause) = self.0.render_pass_draw_indexed_indirect( - &mut pass_data.pass, - *indirect_buffer, - indirect_offset, - ) { + if let Err(cause) = + pass_data + .pass + .draw_indexed_indirect(&self.0, *indirect_buffer, indirect_offset) + { self.handle_error( &pass_data.error_sink, cause, @@ -3024,12 +3026,11 @@ impl crate::Context for ContextWgpuCore { indirect_offset: wgt::BufferAddress, count: u32, ) { - if let Err(cause) = self.0.render_pass_multi_draw_indirect( - &mut pass_data.pass, - *indirect_buffer, - indirect_offset, - count, - ) { + if let Err(cause) = + pass_data + .pass + .multi_draw_indirect(&self.0, *indirect_buffer, indirect_offset, count) + { self.handle_error( &pass_data.error_sink, cause, @@ -3049,8 +3050,8 @@ impl crate::Context for ContextWgpuCore { indirect_offset: wgt::BufferAddress, count: u32, ) { - if let Err(cause) = self.0.render_pass_multi_draw_indexed_indirect( - &mut pass_data.pass, + if let Err(cause) = pass_data.pass.multi_draw_indexed_indirect( + &self.0, *indirect_buffer, indirect_offset, count, @@ -3077,8 +3078,8 @@ impl crate::Context for ContextWgpuCore { count_buffer_offset: wgt::BufferAddress, max_count: u32, ) { - if let Err(cause) = self.0.render_pass_multi_draw_indirect_count( - &mut pass_data.pass, + if let Err(cause) = pass_data.pass.multi_draw_indirect_count( + &self.0, *indirect_buffer, indirect_offset, *count_buffer, @@ -3107,8 +3108,8 @@ impl crate::Context for ContextWgpuCore { count_buffer_offset: wgt::BufferAddress, max_count: u32, ) { - if let Err(cause) = self.0.render_pass_multi_draw_indexed_indirect_count( - &mut pass_data.pass, + if let Err(cause) = pass_data.pass.multi_draw_indexed_indirect_count( + &self.0, *indirect_buffer, indirect_offset, *count_buffer, @@ -3131,10 +3132,7 @@ impl crate::Context for ContextWgpuCore { pass_data: &mut Self::RenderPassData, color: wgt::Color, ) { - if let Err(cause) = self - .0 - .render_pass_set_blend_constant(&mut pass_data.pass, &color) - { + if let Err(cause) = pass_data.pass.set_blend_constant(&self.0, color) { self.handle_error( &pass_data.error_sink, cause, @@ -3154,9 +3152,9 @@ impl crate::Context for ContextWgpuCore { width: u32, height: u32, ) { - if let Err(cause) = - self.0 - .render_pass_set_scissor_rect(&mut pass_data.pass, x, y, width, height) + if let Err(cause) = pass_data + .pass + .set_scissor_rect(&self.0, x, y, width, height) { self.handle_error( &pass_data.error_sink, @@ -3179,15 +3177,10 @@ impl crate::Context for ContextWgpuCore { min_depth: f32, max_depth: f32, ) { - if let Err(cause) = self.0.render_pass_set_viewport( - &mut pass_data.pass, - x, - y, - width, - height, - min_depth, - max_depth, - ) { + if let Err(cause) = pass_data + .pass + .set_viewport(&self.0, x, y, width, height, min_depth, max_depth) + { self.handle_error( &pass_data.error_sink, cause, @@ -3204,10 +3197,7 @@ impl crate::Context for ContextWgpuCore { pass_data: &mut Self::RenderPassData, reference: u32, ) { - if let Err(cause) = self - .0 - .render_pass_set_stencil_reference(&mut pass_data.pass, reference) - { + if let Err(cause) = pass_data.pass.set_stencil_reference(&self.0, reference) { self.handle_error( &pass_data.error_sink, cause, @@ -3224,10 +3214,7 @@ impl crate::Context for ContextWgpuCore { pass_data: &mut Self::RenderPassData, label: &str, ) { - if let Err(cause) = self - .0 - .render_pass_insert_debug_marker(&mut pass_data.pass, label, 0) - { + if let Err(cause) = pass_data.pass.insert_debug_marker(&self.0, label, 0) { self.handle_error( &pass_data.error_sink, cause, @@ -3244,10 +3231,7 @@ impl crate::Context for ContextWgpuCore { pass_data: &mut Self::RenderPassData, group_label: &str, ) { - if let Err(cause) = self - .0 - .render_pass_push_debug_group(&mut pass_data.pass, group_label, 0) - { + if let Err(cause) = pass_data.pass.push_debug_group(&self.0, group_label, 0) { self.handle_error( &pass_data.error_sink, cause, @@ -3263,7 +3247,7 @@ impl crate::Context for ContextWgpuCore { _pass: &mut Self::RenderPassId, pass_data: &mut Self::RenderPassData, ) { - if let Err(cause) = self.0.render_pass_pop_debug_group(&mut pass_data.pass) { + if let Err(cause) = pass_data.pass.pop_debug_group(&self.0) { self.handle_error( &pass_data.error_sink, cause, @@ -3282,9 +3266,9 @@ impl crate::Context for ContextWgpuCore { _query_set_data: &Self::QuerySetData, query_index: u32, ) { - if let Err(cause) = - self.0 - .render_pass_write_timestamp(&mut pass_data.pass, *query_set, query_index) + if let Err(cause) = pass_data + .pass + .write_timestamp(&self.0, *query_set, query_index) { self.handle_error( &pass_data.error_sink, @@ -3302,10 +3286,7 @@ impl crate::Context for ContextWgpuCore { pass_data: &mut Self::RenderPassData, query_index: u32, ) { - if let Err(cause) = self - .0 - .render_pass_begin_occlusion_query(&mut pass_data.pass, query_index) - { + if let Err(cause) = pass_data.pass.begin_occlusion_query(&self.0, query_index) { self.handle_error( &pass_data.error_sink, cause, @@ -3321,7 +3302,7 @@ impl crate::Context for ContextWgpuCore { _pass: &mut Self::RenderPassId, pass_data: &mut Self::RenderPassData, ) { - if let Err(cause) = self.0.render_pass_end_occlusion_query(&mut pass_data.pass) { + if let Err(cause) = pass_data.pass.end_occlusion_query(&self.0) { self.handle_error( &pass_data.error_sink, cause, @@ -3340,11 +3321,11 @@ impl crate::Context for ContextWgpuCore { _query_set_data: &Self::QuerySetData, query_index: u32, ) { - if let Err(cause) = self.0.render_pass_begin_pipeline_statistics_query( - &mut pass_data.pass, - *query_set, - query_index, - ) { + if let Err(cause) = + pass_data + .pass + .begin_pipeline_statistics_query(&self.0, *query_set, query_index) + { self.handle_error( &pass_data.error_sink, cause, @@ -3360,10 +3341,7 @@ impl crate::Context for ContextWgpuCore { _pass: &mut Self::RenderPassId, pass_data: &mut Self::RenderPassData, ) { - if let Err(cause) = self - .0 - .render_pass_end_pipeline_statistics_query(&mut pass_data.pass) - { + if let Err(cause) = pass_data.pass.end_pipeline_statistics_query(&self.0) { self.handle_error( &pass_data.error_sink, cause, @@ -3381,9 +3359,9 @@ impl crate::Context for ContextWgpuCore { render_bundles: &mut dyn Iterator, ) { let temp_render_bundles = render_bundles.map(|(i, _)| i).collect::>(); - if let Err(cause) = self - .0 - .render_pass_execute_bundles(&mut pass_data.pass, &temp_render_bundles) + if let Err(cause) = pass_data + .pass + .execute_bundles(&self.0, &temp_render_bundles) { self.handle_error( &pass_data.error_sink, @@ -3400,9 +3378,7 @@ impl crate::Context for ContextWgpuCore { _pass: &mut Self::RenderPassId, pass_data: &mut Self::RenderPassData, ) { - let encoder = pass_data.pass.parent_id(); - if let Err(cause) = wgc::gfx_select!(encoder => self.0.render_pass_end(&mut pass_data.pass)) - { + if let Err(cause) = pass_data.pass.end(&self.0) { self.handle_error( &pass_data.error_sink, cause, From be4ed826d96964b546801c5b3796984a901b6cf2 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sat, 29 Jun 2024 14:07:50 +0200 Subject: [PATCH 06/15] Use of dynrenderpass in deno --- deno_webgpu/command_encoder.rs | 7 ++- deno_webgpu/render_pass.rs | 111 ++++++++++++++++----------------- 2 files changed, 58 insertions(+), 60 deletions(-) diff --git a/deno_webgpu/command_encoder.rs b/deno_webgpu/command_encoder.rs index 177cea28c7..ba21bb05b5 100644 --- a/deno_webgpu/command_encoder.rs +++ b/deno_webgpu/command_encoder.rs @@ -200,6 +200,8 @@ pub fn op_webgpu_command_encoder_begin_render_pass( .transpose()? .map(|query_set| query_set.1); + let instance = state.borrow::(); + let command_encoder = &command_encoder_resource.1; let descriptor = wgpu_core::command::RenderPassDescriptor { label: Some(label), color_attachments: Cow::from(color_attachments), @@ -208,15 +210,14 @@ pub fn op_webgpu_command_encoder_begin_render_pass( occlusion_query_set: occlusion_query_set_resource, }; - let render_pass = wgpu_core::command::RenderPass::new(command_encoder_resource.1, &descriptor); - + let (render_pass, error) = gfx_select!(command_encoder => instance.command_encoder_create_render_pass_dyn(*command_encoder, &descriptor)); let rid = state .resource_table .add(super::render_pass::WebGpuRenderPass(RefCell::new( render_pass, ))); - Ok(WebGpuResult::rid(rid)) + Ok(WebGpuResult::rid_err(rid, error)) } #[derive(Deserialize)] diff --git a/deno_webgpu/render_pass.rs b/deno_webgpu/render_pass.rs index 5b08925803..941245971c 100644 --- a/deno_webgpu/render_pass.rs +++ b/deno_webgpu/render_pass.rs @@ -9,11 +9,10 @@ use deno_core::ResourceId; use serde::Deserialize; use std::borrow::Cow; use std::cell::RefCell; -use wgpu_core::global::Global; use super::error::WebGpuResult; -pub(crate) struct WebGpuRenderPass(pub(crate) RefCell); +pub(crate) struct WebGpuRenderPass(pub(crate) RefCell>); impl Resource for WebGpuRenderPass { fn name(&self) -> Cow { "webGPURenderPass".into() @@ -42,8 +41,8 @@ pub fn op_webgpu_render_pass_set_viewport( .resource_table .get::(args.render_pass_rid)?; - state.borrow::().render_pass_set_viewport( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().set_viewport( + state.borrow(), args.x, args.y, args.width, @@ -69,13 +68,10 @@ pub fn op_webgpu_render_pass_set_scissor_rect( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_set_scissor_rect( - &mut render_pass_resource.0.borrow_mut(), - x, - y, - width, - height, - )?; + render_pass_resource + .0 + .borrow_mut() + .set_scissor_rect(state.borrow(), x, y, width, height)?; Ok(WebGpuResult::empty()) } @@ -91,9 +87,10 @@ pub fn op_webgpu_render_pass_set_blend_constant( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_set_blend_constant(&mut render_pass_resource.0.borrow_mut(), &color)?; + render_pass_resource + .0 + .borrow_mut() + .set_blend_constant(state.borrow(), color)?; Ok(WebGpuResult::empty()) } @@ -109,9 +106,10 @@ pub fn op_webgpu_render_pass_set_stencil_reference( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_set_stencil_reference(&mut render_pass_resource.0.borrow_mut(), reference)?; + render_pass_resource + .0 + .borrow_mut() + .set_stencil_reference(state.borrow(), reference)?; Ok(WebGpuResult::empty()) } @@ -127,9 +125,10 @@ pub fn op_webgpu_render_pass_begin_occlusion_query( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_begin_occlusion_query(&mut render_pass_resource.0.borrow_mut(), query_index)?; + render_pass_resource + .0 + .borrow_mut() + .begin_occlusion_query(state.borrow(), query_index)?; Ok(WebGpuResult::empty()) } @@ -144,9 +143,10 @@ pub fn op_webgpu_render_pass_end_occlusion_query( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_end_occlusion_query(&mut render_pass_resource.0.borrow_mut())?; + render_pass_resource + .0 + .borrow_mut() + .end_occlusion_query(state.borrow())?; Ok(WebGpuResult::empty()) } @@ -172,9 +172,10 @@ pub fn op_webgpu_render_pass_execute_bundles( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_execute_bundles(&mut render_pass_resource.0.borrow_mut(), &bundles)?; + render_pass_resource + .0 + .borrow_mut() + .execute_bundles(state.borrow(), &bundles)?; Ok(WebGpuResult::empty()) } @@ -189,12 +190,7 @@ pub fn op_webgpu_render_pass_end( .resource_table .take::(render_pass_rid)?; - // TODO: Just like parent_id ComputePass, there's going to be DynComputePass soon which will eliminate the need of doing gfx_select here. - let instance = state.borrow::(); - let parent_id = render_pass_resource.0.borrow().parent_id(); - gfx_select!(parent_id => instance.render_pass_end( - &mut render_pass_resource.0.borrow_mut() - ))?; + render_pass_resource.0.borrow_mut().end(state.borrow())?; Ok(WebGpuResult::empty()) } @@ -226,8 +222,8 @@ pub fn op_webgpu_render_pass_set_bind_group( let dynamic_offsets_data: &[u32] = &dynamic_offsets_data[start..start + len]; - state.borrow::().render_pass_set_bind_group( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().set_bind_group( + state.borrow(), index, bind_group_resource.1, dynamic_offsets_data, @@ -247,8 +243,8 @@ pub fn op_webgpu_render_pass_push_debug_group( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_push_debug_group( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().push_debug_group( + state.borrow(), group_label, 0, // wgpu#975 )?; @@ -266,9 +262,10 @@ pub fn op_webgpu_render_pass_pop_debug_group( .resource_table .get::(render_pass_rid)?; - state - .borrow::() - .render_pass_pop_debug_group(&mut render_pass_resource.0.borrow_mut())?; + render_pass_resource + .0 + .borrow_mut() + .pop_debug_group(state.borrow())?; Ok(WebGpuResult::empty()) } @@ -284,8 +281,8 @@ pub fn op_webgpu_render_pass_insert_debug_marker( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_insert_debug_marker( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().insert_debug_marker( + state.borrow(), marker_label, 0, // wgpu#975 )?; @@ -307,10 +304,10 @@ pub fn op_webgpu_render_pass_set_pipeline( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_set_pipeline( - &mut render_pass_resource.0.borrow_mut(), - render_pipeline_resource.1, - )?; + render_pass_resource + .0 + .borrow_mut() + .set_pipeline(state.borrow(), render_pipeline_resource.1)?; Ok(WebGpuResult::empty()) } @@ -341,8 +338,8 @@ pub fn op_webgpu_render_pass_set_index_buffer( None }; - state.borrow::().render_pass_set_index_buffer( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().set_index_buffer( + state.borrow(), buffer_resource.1, index_format, offset, @@ -378,8 +375,8 @@ pub fn op_webgpu_render_pass_set_vertex_buffer( None }; - state.borrow::().render_pass_set_vertex_buffer( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().set_vertex_buffer( + state.borrow(), slot, buffer_resource.1, offset, @@ -403,8 +400,8 @@ pub fn op_webgpu_render_pass_draw( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_draw( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().draw( + state.borrow(), vertex_count, instance_count, first_vertex, @@ -429,8 +426,8 @@ pub fn op_webgpu_render_pass_draw_indexed( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_draw_indexed( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().draw_indexed( + state.borrow(), index_count, instance_count, first_index, @@ -456,8 +453,8 @@ pub fn op_webgpu_render_pass_draw_indirect( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_draw_indirect( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().draw_indirect( + state.borrow(), buffer_resource.1, indirect_offset, )?; @@ -480,8 +477,8 @@ pub fn op_webgpu_render_pass_draw_indexed_indirect( .resource_table .get::(render_pass_rid)?; - state.borrow::().render_pass_draw_indexed_indirect( - &mut render_pass_resource.0.borrow_mut(), + render_pass_resource.0.borrow_mut().draw_indexed_indirect( + state.borrow(), buffer_resource.1, indirect_offset, )?; From 2ebdaf6948567a80071f2d4f70ac0f15ec720ee7 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sat, 29 Jun 2024 13:54:51 +0200 Subject: [PATCH 07/15] Separate active occlusion & pipeline statitics query --- wgpu-core/src/command/render.rs | 21 ++++++++++++++------- 1 file changed, 14 insertions(+), 7 deletions(-) diff --git a/wgpu-core/src/command/render.rs b/wgpu-core/src/command/render.rs index 6565b05264..206602141d 100644 --- a/wgpu-core/src/command/render.rs +++ b/wgpu-core/src/command/render.rs @@ -477,7 +477,9 @@ struct State<'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> { temp_offsets: Vec, dynamic_offset_count: usize, string_offset: usize, - active_query: Option<(Arc>, u32)>, + + active_occlusion_query: Option<(Arc>, u32)>, + active_pipeline_statistics_query: Option<(Arc>, u32)>, } impl<'scope, 'snatch_guard, 'cmd_buf, 'raw_encoder, A: HalApi> @@ -1697,7 +1699,9 @@ impl Global { temp_offsets: Vec::new(), dynamic_offset_count: 0, string_offset: 0, - active_query: None, + + active_occlusion_query: None, + active_pipeline_statistics_query: None, }; for command in base.commands { @@ -1896,7 +1900,7 @@ impl Global { &mut state.tracker.query_sets, query_index, Some(&mut cmd_buf_data.pending_query_resets), - &mut state.active_query, + &mut state.active_occlusion_query, ) .map_pass_err(scope)?; } @@ -1904,7 +1908,7 @@ impl Global { api_log!("RenderPass::end_occlusion_query"); let scope = PassErrorScope::EndOcclusionQuery; - end_occlusion_query(state.raw_encoder, &mut state.active_query) + end_occlusion_query(state.raw_encoder, &mut state.active_occlusion_query) .map_pass_err(scope)?; } ArcRenderCommand::BeginPipelineStatisticsQuery { @@ -1924,7 +1928,7 @@ impl Global { cmd_buf.as_ref(), query_index, Some(&mut cmd_buf_data.pending_query_resets), - &mut state.active_query, + &mut state.active_pipeline_statistics_query, ) .map_pass_err(scope)?; } @@ -1932,8 +1936,11 @@ impl Global { api_log!("RenderPass::end_pipeline_statistics_query"); let scope = PassErrorScope::EndPipelineStatisticsQuery; - end_pipeline_statistics_query(state.raw_encoder, &mut state.active_query) - .map_pass_err(scope)?; + end_pipeline_statistics_query( + state.raw_encoder, + &mut state.active_pipeline_statistics_query, + ) + .map_pass_err(scope)?; } ArcRenderCommand::ExecuteBundle(bundle) => { let scope = PassErrorScope::ExecuteBundle; From cdd623ad802d1a6a21892dcdd4eac7ce3f28529e Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sat, 29 Jun 2024 13:18:10 +0200 Subject: [PATCH 08/15] resolve render/compute command is now behind `replay` feature --- wgpu-core/src/command/compute.rs | 8 +++++--- wgpu-core/src/command/compute_command.rs | 10 ++++------ wgpu-core/src/command/render.rs | 7 ++++--- wgpu-core/src/command/render_command.rs | 15 +++++++-------- 4 files changed, 20 insertions(+), 20 deletions(-) diff --git a/wgpu-core/src/command/compute.rs b/wgpu-core/src/command/compute.rs index 36b2413e68..5636bf6a5a 100644 --- a/wgpu-core/src/command/compute.rs +++ b/wgpu-core/src/command/compute.rs @@ -4,7 +4,7 @@ use crate::{ }, command::{ bind::Binder, - compute_command::{ArcComputeCommand, ComputeCommand}, + compute_command::ArcComputeCommand, end_pipeline_statistics_query, memory_init::{fixup_discarded_surfaces, SurfacesInDiscardState}, validate_and_begin_pipeline_statistics_query, ArcPassTimestampWrites, BasePass, @@ -405,17 +405,19 @@ impl Global { } #[doc(hidden)] + #[cfg(feature = "replay")] pub fn compute_pass_end_with_unresolved_commands( &self, encoder_id: id::CommandEncoderId, - base: BasePass, + base: BasePass, timestamp_writes: Option<&PassTimestampWrites>, ) -> Result<(), ComputePassError> { let hub = A::hub(self); let scope = PassErrorScope::PassEncoder(encoder_id); let cmd_buf = CommandBuffer::get_encoder(hub, encoder_id).map_pass_err(scope)?; - let commands = ComputeCommand::resolve_compute_command_ids(A::hub(self), &base.commands)?; + let commands = + super::ComputeCommand::resolve_compute_command_ids(A::hub(self), &base.commands)?; let timestamp_writes = if let Some(tw) = timestamp_writes { Some(ArcPassTimestampWrites { diff --git a/wgpu-core/src/command/compute_command.rs b/wgpu-core/src/command/compute_command.rs index eb8ce9fa34..aa39a309b5 100644 --- a/wgpu-core/src/command/compute_command.rs +++ b/wgpu-core/src/command/compute_command.rs @@ -8,8 +8,6 @@ use crate::{ resource::{Buffer, QuerySet}, }; -use super::{ComputePassError, ComputePassErrorInner, PassErrorScope}; - #[derive(Clone, Copy, Debug)] #[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))] pub enum ComputeCommand { @@ -72,13 +70,13 @@ pub enum ComputeCommand { impl ComputeCommand { /// Resolves all ids in a list of commands into the corresponding resource Arc. - // - // TODO: Once resolving is done on-the-fly during recording, this function should be only needed with the replay feature: - // #[cfg(feature = "replay")] + #[cfg(feature = "replay")] pub fn resolve_compute_command_ids( hub: &crate::hub::Hub, commands: &[ComputeCommand], - ) -> Result>, ComputePassError> { + ) -> Result>, super::ComputePassError> { + use super::{ComputePassError, ComputePassErrorInner, PassErrorScope}; + let buffers_guard = hub.buffers.read(); let bind_group_guard = hub.bind_groups.read(); let query_set_guard = hub.query_sets.read(); diff --git a/wgpu-core/src/command/render.rs b/wgpu-core/src/command/render.rs index 206602141d..048dda0d22 100644 --- a/wgpu-core/src/command/render.rs +++ b/wgpu-core/src/command/render.rs @@ -51,7 +51,7 @@ use serde::Serialize; use std::sync::Arc; use std::{borrow::Cow, fmt, iter, mem, num::NonZeroU32, ops::Range, str}; -use super::render_command::{ArcRenderCommand, RenderCommand}; +use super::render_command::ArcRenderCommand; use super::{ memory_init::TextureSurfaceDiscard, CommandBufferTextureMemoryActions, CommandEncoder, QueryResetMap, @@ -1496,10 +1496,11 @@ impl Global { } #[doc(hidden)] + #[cfg(feature = "replay")] pub fn render_pass_end_with_unresolved_commands( &self, encoder_id: id::CommandEncoderId, - base: BasePass, + base: BasePass, color_attachments: &[Option], depth_stencil_attachment: Option<&RenderPassDepthStencilAttachment>, timestamp_writes: Option<&PassTimestampWrites>, @@ -1533,7 +1534,7 @@ impl Global { let hub = A::hub(self); render_pass.base = Some(BasePass { label, - commands: RenderCommand::resolve_render_command_ids(hub, &commands)?, + commands: super::RenderCommand::resolve_render_command_ids(hub, &commands)?, dynamic_offsets, string_data, push_constant_data, diff --git a/wgpu-core/src/command/render_command.rs b/wgpu-core/src/command/render_command.rs index 3140b78e68..ad0dbaa505 100644 --- a/wgpu-core/src/command/render_command.rs +++ b/wgpu-core/src/command/render_command.rs @@ -9,10 +9,7 @@ use wgt::{BufferAddress, BufferSize, Color}; use std::{num::NonZeroU32, sync::Arc}; -use super::{ - DrawKind, PassErrorScope, Rect, RenderBundle, RenderCommandError, RenderPassError, - RenderPassErrorInner, -}; +use super::{Rect, RenderBundle}; #[doc(hidden)] #[derive(Clone, Copy, Debug)] @@ -128,13 +125,15 @@ pub enum RenderCommand { impl RenderCommand { /// Resolves all ids in a list of commands into the corresponding resource Arc. - // - // TODO: Once resolving is done on-the-fly during recording, this function should be only needed with the replay feature: - // #[cfg(feature = "replay")] + #[cfg(feature = "replay")] pub fn resolve_render_command_ids( hub: &crate::hub::Hub, commands: &[RenderCommand], - ) -> Result>, RenderPassError> { + ) -> Result>, super::RenderPassError> { + use super::{ + DrawKind, PassErrorScope, RenderCommandError, RenderPassError, RenderPassErrorInner, + }; + let buffers_guard = hub.buffers.read(); let bind_group_guard = hub.bind_groups.read(); let query_set_guard = hub.query_sets.read(); From 671ec6f365dedb34ca3d1ddada7a5ece0c27ac46 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 16 Jun 2024 11:23:05 +0200 Subject: [PATCH 09/15] add vertex & index buffer to ownership test --- tests/tests/render_pass_ownership.rs | 37 +++++++++++++++++++++++++--- 1 file changed, 33 insertions(+), 4 deletions(-) diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs index 192bbad7bb..cb437ee31e 100644 --- a/tests/tests/render_pass_ownership.rs +++ b/tests/tests/render_pass_ownership.rs @@ -2,8 +2,6 @@ //! I.e. once a resource is passed in to a render pass, it can be dropped. //! //! TODO: Methods that take resources that weren't tested here: -//! * rpass.set_index_buffer(buffer_slice, index_format) -//! * rpass.set_vertex_buffer(slot, buffer_slice) //! * rpass.draw_indexed_indirect(indirect_buffer, indirect_offset) //! * rpass.execute_bundles(render_bundles) //! * rpass.multi_draw_indirect(indirect_buffer, indirect_offset, count) @@ -51,6 +49,8 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { cpu_buffer, buffer_size, indirect_buffer, + vertex_buffer, + index_buffer, bind_group, pipeline, color_attachment_view, @@ -89,12 +89,16 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { rpass.set_pipeline(&pipeline); rpass.set_bind_group(0, &bind_group, &[]); + rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); + rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); rpass.draw_indirect(&indirect_buffer, 0); // Now drop all resources we set. Then do a device poll to make sure the resources are really not dropped too early, no matter what. drop(pipeline); drop(bind_group); drop(indirect_buffer); + drop(vertex_buffer); + drop(index_buffer); ctx.async_poll(wgpu::Maintain::wait()) .await .panic_on_timeout(); @@ -134,6 +138,8 @@ struct ResourceSetup { buffer_size: u64, indirect_buffer: wgpu::Buffer, + vertex_buffer: wgpu::Buffer, + index_buffer: wgpu::Buffer, bind_group: wgpu::BindGroup, pipeline: wgpu::RenderPipeline, @@ -183,13 +189,14 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { mapped_at_creation: false, }); + let vertex_count = 3; let indirect_buffer = ctx .device .create_buffer_init(&wgpu::util::BufferInitDescriptor { label: Some("gpu_buffer"), usage: wgpu::BufferUsages::INDIRECT, contents: wgpu::util::DrawIndirectArgs { - vertex_count: 3, + vertex_count, instance_count: 1, first_vertex: 0, first_instance: 0, @@ -197,6 +204,21 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { .as_bytes(), }); + let vertex_buffer = ctx.device.create_buffer(&wgpu::BufferDescriptor { + label: Some("vertex_buffer"), + usage: wgpu::BufferUsages::VERTEX, + size: std::mem::size_of::() as u64 * vertex_count as u64, + mapped_at_creation: false, + }); + + let index_buffer = ctx + .device + .create_buffer_init(&wgpu::util::BufferInitDescriptor { + label: Some("vertex_buffer"), + usage: wgpu::BufferUsages::INDEX, + contents: bytemuck::cast_slice(&[0_u32, 1, 2]), + }); + let bind_group = ctx.device.create_bind_group(&wgpu::BindGroupDescriptor { label: Some("bind_group"), layout: &bgl, @@ -261,7 +283,11 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { module: &sm, entry_point: "vs_main", compilation_options: Default::default(), - buffers: &[], + buffers: &[wgpu::VertexBufferLayout { + array_stride: 4, + step_mode: wgpu::VertexStepMode::Vertex, + attributes: &wgpu::vertex_attr_array![0 => Uint32], + }], }, fragment: Some(wgpu::FragmentState { module: &sm, @@ -294,7 +320,10 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { gpu_buffer, cpu_buffer, buffer_size, + indirect_buffer, + vertex_buffer, + index_buffer, bind_group, pipeline, From 14edc8e1d2e31f9ea71475b07919fb4194f2e32a Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 16 Jun 2024 11:25:59 +0200 Subject: [PATCH 10/15] test for pipeline statistics query --- tests/tests/render_pass_ownership.rs | 75 +++++++++++++++++++++++++++- 1 file changed, 74 insertions(+), 1 deletion(-) diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs index cb437ee31e..37c7d090ff 100644 --- a/tests/tests/render_pass_ownership.rs +++ b/tests/tests/render_pass_ownership.rs @@ -8,7 +8,6 @@ //! * rpass.multi_draw_indexed_indirect(indirect_buffer, indirect_offset, count) //! * rpass.multi_draw_indirect_count //! * rpass.multi_draw_indexed_indirect_count -//! * rpass.begin_pipeline_statistics_query //! * rpass.write_timestamp use std::num::NonZeroU64; @@ -107,6 +106,80 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { assert_render_pass_executed_normally(encoder, gpu_buffer, cpu_buffer, buffer_size, ctx).await; } +#[gpu_test] +static RENDER_PASS_QUERY_SET_OWNERSHIP_PIPELINE_STATISTICS: GpuTestConfiguration = + GpuTestConfiguration::new() + .parameters( + TestParameters::default() + .test_features_limits() + .features(wgpu::Features::PIPELINE_STATISTICS_QUERY), + ) + .run_async(render_pass_query_set_ownership_pipeline_statistics); + +async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext) { + let ResourceSetup { + gpu_buffer, + cpu_buffer, + buffer_size, + indirect_buffer: _, + vertex_buffer, + index_buffer, + bind_group, + pipeline, + color_attachment_view, + color_attachment_resolve_view: _, + depth_stencil_view, + } = resource_setup(&ctx); + + let query_set = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { + label: Some("query_set"), + ty: wgpu::QueryType::PipelineStatistics( + wgpu::PipelineStatisticsTypes::COMPUTE_SHADER_INVOCATIONS, + ), + count: 1, + }); + + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + + { + let mut rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { + label: Some("render_pass"), + color_attachments: &[Some(wgpu::RenderPassColorAttachment { + view: &color_attachment_view, + resolve_target: None, + ops: wgpu::Operations::default(), + })], + depth_stencil_attachment: Some(wgpu::RenderPassDepthStencilAttachment { + view: &depth_stencil_view, + depth_ops: Some(wgpu::Operations { + load: wgpu::LoadOp::Clear(1.0), + store: wgpu::StoreOp::Store, + }), + stencil_ops: None, + }), + timestamp_writes: None, + occlusion_query_set: None, + }); + rpass.set_pipeline(&pipeline); + rpass.set_bind_group(0, &bind_group, &[]); + rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); + rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); + rpass.begin_pipeline_statistics_query(&query_set, 0); + rpass.draw(0..3, 0..1); + rpass.end_pipeline_statistics_query(); + + // Drop the query set. Then do a device poll to make sure it's not dropped too early, no matter what. + drop(query_set); + ctx.async_poll(wgpu::Maintain::wait()) + .await + .panic_on_timeout(); + } + + assert_render_pass_executed_normally(encoder, gpu_buffer, cpu_buffer, buffer_size, ctx).await; +} + async fn assert_render_pass_executed_normally( mut encoder: wgpu::CommandEncoder, gpu_buffer: wgpu::Buffer, From 4db260ee73dfa8290d702f35f9337cf6a5d94dca Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 16 Jun 2024 11:28:34 +0200 Subject: [PATCH 11/15] add occlusion query set to pass resource test --- tests/tests/render_pass_ownership.rs | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs index 37c7d090ff..9e47897330 100644 --- a/tests/tests/render_pass_ownership.rs +++ b/tests/tests/render_pass_ownership.rs @@ -55,6 +55,7 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { color_attachment_view, color_attachment_resolve_view, depth_stencil_view, + occlusion_query_set, } = resource_setup(&ctx); let mut encoder = ctx @@ -78,7 +79,7 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { stencil_ops: None, }), timestamp_writes: None, - occlusion_query_set: None, + occlusion_query_set: Some(&occlusion_query_set), }); // Drop render pass attachments right away. @@ -90,7 +91,9 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { rpass.set_bind_group(0, &bind_group, &[]); rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); + rpass.begin_occlusion_query(0); rpass.draw_indirect(&indirect_buffer, 0); + rpass.end_occlusion_query(); // Now drop all resources we set. Then do a device poll to make sure the resources are really not dropped too early, no matter what. drop(pipeline); @@ -98,6 +101,7 @@ async fn render_pass_resource_ownership(ctx: TestingContext) { drop(indirect_buffer); drop(vertex_buffer); drop(index_buffer); + drop(occlusion_query_set); ctx.async_poll(wgpu::Maintain::wait()) .await .panic_on_timeout(); @@ -129,6 +133,7 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext color_attachment_view, color_attachment_resolve_view: _, depth_stencil_view, + occlusion_query_set: _, } = resource_setup(&ctx); let query_set = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { @@ -219,6 +224,7 @@ struct ResourceSetup { color_attachment_view: wgpu::TextureView, color_attachment_resolve_view: wgpu::TextureView, depth_stencil_view: wgpu::TextureView, + occlusion_query_set: wgpu::QuerySet, } fn resource_setup(ctx: &TestingContext) -> ResourceSetup { @@ -347,6 +353,12 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { }); let depth_stencil_view = depth_stencil.create_view(&wgpu::TextureViewDescriptor::default()); + let occlusion_query_set = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { + label: Some("occ_query_set"), + ty: wgpu::QueryType::Occlusion, + count: 1, + }); + let pipeline = ctx .device .create_render_pipeline(&wgpu::RenderPipelineDescriptor { @@ -403,5 +415,6 @@ fn resource_setup(ctx: &TestingContext) -> ResourceSetup { color_attachment_view, color_attachment_resolve_view, depth_stencil_view, + occlusion_query_set, } } From fb2c42b224eecbd7724263e6331dca2f5e53b9d7 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Mon, 24 Jun 2024 23:56:41 +0200 Subject: [PATCH 12/15] add tests for resource ownership of render pass query timestamps --- tests/tests/compute_pass_ownership.rs | 6 +- tests/tests/render_pass_ownership.rs | 92 +++++++++++++++++++++++---- 2 files changed, 81 insertions(+), 17 deletions(-) diff --git a/tests/tests/compute_pass_ownership.rs b/tests/tests/compute_pass_ownership.rs index 459dbe64e2..5c0971c6d9 100644 --- a/tests/tests/compute_pass_ownership.rs +++ b/tests/tests/compute_pass_ownership.rs @@ -111,14 +111,14 @@ async fn compute_pass_query_set_ownership_pipeline_statistics(ctx: TestingContex } #[gpu_test] -static COMPUTE_PASS_QUERY_TIMESTAMPS: GpuTestConfiguration = +static COMPUTE_PASS_QUERY_SET_OWNERSHIP_TIMESTAMPS: GpuTestConfiguration = GpuTestConfiguration::new() .parameters(TestParameters::default().test_features_limits().features( wgpu::Features::TIMESTAMP_QUERY | wgpu::Features::TIMESTAMP_QUERY_INSIDE_PASSES, )) - .run_async(compute_pass_query_timestamps); + .run_async(compute_pass_query_set_ownership_timestamps); -async fn compute_pass_query_timestamps(ctx: TestingContext) { +async fn compute_pass_query_set_ownership_timestamps(ctx: TestingContext) { let ResourceSetup { gpu_buffer, cpu_buffer, diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs index 9e47897330..f93393673f 100644 --- a/tests/tests/render_pass_ownership.rs +++ b/tests/tests/render_pass_ownership.rs @@ -8,8 +8,7 @@ //! * rpass.multi_draw_indexed_indirect(indirect_buffer, indirect_offset, count) //! * rpass.multi_draw_indirect_count //! * rpass.multi_draw_indexed_indirect_count -//! * rpass.write_timestamp - +//! use std::num::NonZeroU64; use wgpu::util::DeviceExt as _; @@ -125,21 +124,18 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext gpu_buffer, cpu_buffer, buffer_size, - indirect_buffer: _, vertex_buffer, index_buffer, bind_group, pipeline, color_attachment_view, - color_attachment_resolve_view: _, - depth_stencil_view, - occlusion_query_set: _, + .. } = resource_setup(&ctx); let query_set = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { label: Some("query_set"), ty: wgpu::QueryType::PipelineStatistics( - wgpu::PipelineStatisticsTypes::COMPUTE_SHADER_INVOCATIONS, + wgpu::PipelineStatisticsTypes::VERTEX_SHADER_INVOCATIONS, ), count: 1, }); @@ -150,7 +146,70 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext { let mut rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { - label: Some("render_pass"), + color_attachments: &[Some(wgpu::RenderPassColorAttachment { + view: &color_attachment_view, + resolve_target: None, + ops: wgpu::Operations::default(), + })], + ..Default::default() + }); + rpass.set_pipeline(&pipeline); + rpass.set_bind_group(0, &bind_group, &[]); + rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); + rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); + rpass.begin_pipeline_statistics_query(&query_set, 0); + rpass.draw(0..3, 0..1); + rpass.end_pipeline_statistics_query(); + + // Drop the query set. Then do a device poll to make sure it's not dropped too early, no matter what. + drop(query_set); + ctx.async_poll(wgpu::Maintain::wait()) + .await + .panic_on_timeout(); + } + + assert_render_pass_executed_normally(encoder, gpu_buffer, cpu_buffer, buffer_size, ctx).await; +} + +#[gpu_test] +static RENDER_PASS_QUERY_SET_OWNERSHIP_TIMESTAMPS: GpuTestConfiguration = + GpuTestConfiguration::new() + .parameters(TestParameters::default().test_features_limits().features( + wgpu::Features::TIMESTAMP_QUERY | wgpu::Features::TIMESTAMP_QUERY_INSIDE_PASSES, + )) + .run_async(render_pass_query_set_ownership_timestamps); + +async fn render_pass_query_set_ownership_timestamps(ctx: TestingContext) { + let ResourceSetup { + gpu_buffer, + cpu_buffer, + buffer_size, + color_attachment_view, + depth_stencil_view, + pipeline, + bind_group, + vertex_buffer, + index_buffer, + .. + } = resource_setup(&ctx); + + let query_set_timestamp_writes = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { + label: Some("query_set_timestamp_writes"), + ty: wgpu::QueryType::Timestamp, + count: 2, + }); + let query_set_write_timestamp = ctx.device.create_query_set(&wgpu::QuerySetDescriptor { + label: Some("query_set_write_timestamp"), + ty: wgpu::QueryType::Timestamp, + count: 1, + }); + + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + + { + let mut rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { color_attachments: &[Some(wgpu::RenderPassColorAttachment { view: &color_attachment_view, resolve_target: None, @@ -164,19 +223,24 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext }), stencil_ops: None, }), - timestamp_writes: None, - occlusion_query_set: None, + timestamp_writes: Some(wgpu::RenderPassTimestampWrites { + query_set: &query_set_timestamp_writes, + beginning_of_pass_write_index: Some(0), + end_of_pass_write_index: Some(1), + }), + ..Default::default() }); + rpass.write_timestamp(&query_set_write_timestamp, 0); + rpass.set_pipeline(&pipeline); rpass.set_bind_group(0, &bind_group, &[]); rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); - rpass.begin_pipeline_statistics_query(&query_set, 0); rpass.draw(0..3, 0..1); - rpass.end_pipeline_statistics_query(); - // Drop the query set. Then do a device poll to make sure it's not dropped too early, no matter what. - drop(query_set); + // Drop the query sets. Then do a device poll to make sure they're not dropped too early, no matter what. + drop(query_set_timestamp_writes); + drop(query_set_write_timestamp); ctx.async_poll(wgpu::Maintain::wait()) .await .panic_on_timeout(); From a9ebbc9f3d26367bfc8531b900d2a4129341e159 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Tue, 25 Jun 2024 00:22:40 +0200 Subject: [PATCH 13/15] RenderPass can now be made 'static just like ComputePass. Add respective test --- tests/tests/render_pass_ownership.rs | 70 ++++++++- wgpu/src/lib.rs | 220 +++++++++++++++------------ 2 files changed, 195 insertions(+), 95 deletions(-) diff --git a/tests/tests/render_pass_ownership.rs b/tests/tests/render_pass_ownership.rs index f93393673f..95fc0fbdc9 100644 --- a/tests/tests/render_pass_ownership.rs +++ b/tests/tests/render_pass_ownership.rs @@ -12,7 +12,7 @@ use std::num::NonZeroU64; use wgpu::util::DeviceExt as _; -use wgpu_test::{gpu_test, GpuTestConfiguration, TestParameters, TestingContext}; +use wgpu_test::{gpu_test, valid, GpuTestConfiguration, TestParameters, TestingContext}; // Minimal shader with buffer based side effect - only needed to check whether the render pass has executed at all. const SHADER_SRC: &str = " @@ -129,6 +129,7 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext bind_group, pipeline, color_attachment_view, + depth_stencil_view, .. } = resource_setup(&ctx); @@ -151,6 +152,14 @@ async fn render_pass_query_set_ownership_pipeline_statistics(ctx: TestingContext resolve_target: None, ops: wgpu::Operations::default(), })], + depth_stencil_attachment: Some(wgpu::RenderPassDepthStencilAttachment { + view: &depth_stencil_view, + depth_ops: Some(wgpu::Operations { + load: wgpu::LoadOp::Clear(1.0), + store: wgpu::StoreOp::Store, + }), + stencil_ops: None, + }), ..Default::default() }); rpass.set_pipeline(&pipeline); @@ -249,6 +258,65 @@ async fn render_pass_query_set_ownership_timestamps(ctx: TestingContext) { assert_render_pass_executed_normally(encoder, gpu_buffer, cpu_buffer, buffer_size, ctx).await; } +#[gpu_test] +static RENDER_PASS_KEEP_ENCODER_ALIVE: GpuTestConfiguration = GpuTestConfiguration::new() + .parameters(TestParameters::default().test_features_limits()) + .run_async(render_pass_keep_encoder_alive); + +async fn render_pass_keep_encoder_alive(ctx: TestingContext) { + let ResourceSetup { + bind_group, + vertex_buffer, + index_buffer, + pipeline, + color_attachment_view, + depth_stencil_view, + .. + } = resource_setup(&ctx); + + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + let rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { + color_attachments: &[Some(wgpu::RenderPassColorAttachment { + view: &color_attachment_view, + resolve_target: None, + ops: wgpu::Operations::default(), + })], + depth_stencil_attachment: Some(wgpu::RenderPassDepthStencilAttachment { + view: &depth_stencil_view, + depth_ops: Some(wgpu::Operations { + load: wgpu::LoadOp::Clear(1.0), + store: wgpu::StoreOp::Store, + }), + stencil_ops: None, + }), + ..Default::default() + }); + + // Now drop the encoder - it is kept alive by the compute pass. + // To do so, we have to make the compute pass forget the lifetime constraint first. + let mut rpass = rpass.forget_lifetime(); + drop(encoder); + + ctx.async_poll(wgpu::Maintain::wait()) + .await + .panic_on_timeout(); + + // Record some a draw command. + rpass.set_pipeline(&pipeline); + rpass.set_bind_group(0, &bind_group, &[]); + rpass.set_vertex_buffer(0, vertex_buffer.slice(..)); + rpass.set_index_buffer(index_buffer.slice(..), wgpu::IndexFormat::Uint32); + rpass.draw(0..3, 0..1); + + // Dropping the pass will still execute the pass, even though there's no way to submit it. + // Ideally, this would log an error, but the encoder is not dropped until the compute pass is dropped, + // making this a valid operation. + // (If instead the encoder was explicitly destroyed or finished, this would be an error.) + valid(&ctx.device, || drop(rpass)); +} + async fn assert_render_pass_executed_normally( mut encoder: wgpu::CommandEncoder, gpu_buffer: wgpu::Buffer, diff --git a/wgpu/src/lib.rs b/wgpu/src/lib.rs index 6b44f08a8e..5eaec79eb2 100644 --- a/wgpu/src/lib.rs +++ b/wgpu/src/lib.rs @@ -1274,9 +1274,19 @@ impl Drop for CommandEncoder { /// https://gpuweb.github.io/gpuweb/#render-pass-encoder). #[derive(Debug)] pub struct RenderPass<'encoder> { + /// The inner data of the render pass, separated out so it's easy to replace the lifetime with 'static if desired. + inner: RenderPassInner, + + /// This lifetime is used to protect the [`CommandEncoder`] from being used + /// while the pass is alive. + encoder_guard: PhantomData<&'encoder ()>, +} + +#[derive(Debug)] +struct RenderPassInner { id: ObjectId, data: Box, - parent: &'encoder mut CommandEncoder, + context: Arc, } /// In-progress recording of a compute pass. @@ -3883,12 +3893,13 @@ impl CommandEncoder { /// Begins recording of a render pass. /// /// This function returns a [`RenderPass`] object which records a single render pass. - // - // TODO(https://github.com/gfx-rs/wgpu/issues/1453): - // Just like with compute passes, we should have a way to opt out of the lifetime constraint. - // See https://github.com/gfx-rs/wgpu/pull/5768 for details - // Once this is done, the documentation for `begin_render_pass` and `begin_compute_pass` should - // be nearly identical. + /// + /// As long as the returned [`RenderPass`] has not ended, + /// any mutating operation on this command encoder causes an error and invalidates it. + /// Note that the `'encoder` lifetime relationship protects against this, + /// but it is possible to opt out of it by calling [`RenderPass::forget_lifetime`]. + /// This can be useful for runtime handling of the encoder->pass + /// dependency e.g. when pass and encoder are stored in the same data structure. pub fn begin_render_pass<'encoder>( &'encoder mut self, desc: &RenderPassDescriptor<'_>, @@ -3901,9 +3912,12 @@ impl CommandEncoder { desc, ); RenderPass { - id, - data, - parent: self, + inner: RenderPassInner { + id, + data, + context: self.context.clone(), + }, + encoder_guard: PhantomData, } } @@ -4175,6 +4189,25 @@ impl CommandEncoder { } impl<'encoder> RenderPass<'encoder> { + /// Drops the lifetime relationship to the parent command encoder, making usage of + /// the encoder while this pass is recorded a run-time error instead. + /// + /// Attention: As long as the render pass has not been ended, any mutating operation on the parent + /// command encoder will cause a run-time error and invalidate it! + /// By default, the lifetime constraint prevents this, but it can be useful + /// to handle this at run time, such as when storing the pass and encoder in the same + /// data structure. + /// + /// This operation has no effect on pass recording. + /// It's a safe operation, since [`CommandEncoder`] is in a locked state as long as the pass is active + /// regardless of the lifetime constraint or its absence. + pub fn forget_lifetime(self) -> RenderPass<'static> { + RenderPass { + inner: self.inner, + encoder_guard: PhantomData, + } + } + /// Sets the active bind group for a given bind group index. The bind group layout /// in the active pipeline when any `draw_*()` method is called must match the layout of /// this bind group. @@ -4191,9 +4224,9 @@ impl<'encoder> RenderPass<'encoder> { offsets: &[DynamicOffset], ) { DynContext::render_pass_set_bind_group( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), index, &bind_group.id, bind_group.data.as_ref(), @@ -4206,9 +4239,9 @@ impl<'encoder> RenderPass<'encoder> { /// Subsequent draw calls will exhibit the behavior defined by `pipeline`. pub fn set_pipeline(&mut self, pipeline: &RenderPipeline) { DynContext::render_pass_set_pipeline( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &pipeline.id, pipeline.data.as_ref(), ) @@ -4221,9 +4254,9 @@ impl<'encoder> RenderPass<'encoder> { /// (all components zero). pub fn set_blend_constant(&mut self, color: Color) { DynContext::render_pass_set_blend_constant( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), color, ) } @@ -4234,9 +4267,9 @@ impl<'encoder> RenderPass<'encoder> { /// use `buffer` as the source index buffer. pub fn set_index_buffer(&mut self, buffer_slice: BufferSlice<'_>, index_format: IndexFormat) { DynContext::render_pass_set_index_buffer( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &buffer_slice.buffer.id, buffer_slice.buffer.data.as_ref(), index_format, @@ -4257,9 +4290,9 @@ impl<'encoder> RenderPass<'encoder> { /// [`draw_indexed`]: RenderPass::draw_indexed pub fn set_vertex_buffer(&mut self, slot: u32, buffer_slice: BufferSlice<'_>) { DynContext::render_pass_set_vertex_buffer( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), slot, &buffer_slice.buffer.id, buffer_slice.buffer.data.as_ref(), @@ -4279,9 +4312,9 @@ impl<'encoder> RenderPass<'encoder> { /// but it does not affect the coordinate system, only which fragments are discarded. pub fn set_scissor_rect(&mut self, x: u32, y: u32, width: u32, height: u32) { DynContext::render_pass_set_scissor_rect( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), x, y, width, @@ -4297,9 +4330,9 @@ impl<'encoder> RenderPass<'encoder> { /// targets. pub fn set_viewport(&mut self, x: f32, y: f32, w: f32, h: f32, min_depth: f32, max_depth: f32) { DynContext::render_pass_set_viewport( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), x, y, w, @@ -4315,9 +4348,9 @@ impl<'encoder> RenderPass<'encoder> { /// If this method has not been called, the stencil reference value defaults to `0`. pub fn set_stencil_reference(&mut self, reference: u32) { DynContext::render_pass_set_stencil_reference( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), reference, ); } @@ -4325,9 +4358,9 @@ impl<'encoder> RenderPass<'encoder> { /// Inserts debug marker. pub fn insert_debug_marker(&mut self, label: &str) { DynContext::render_pass_insert_debug_marker( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), label, ); } @@ -4335,9 +4368,9 @@ impl<'encoder> RenderPass<'encoder> { /// Start record commands and group it into debug marker group. pub fn push_debug_group(&mut self, label: &str) { DynContext::render_pass_push_debug_group( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), label, ); } @@ -4345,9 +4378,9 @@ impl<'encoder> RenderPass<'encoder> { /// Stops command recording and creates debug group. pub fn pop_debug_group(&mut self) { DynContext::render_pass_pop_debug_group( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), ); } @@ -4374,9 +4407,9 @@ impl<'encoder> RenderPass<'encoder> { /// It is not affected by changes to the state that are performed after it is called. pub fn draw(&mut self, vertices: Range, instances: Range) { DynContext::render_pass_draw( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), vertices, instances, ) @@ -4408,9 +4441,9 @@ impl<'encoder> RenderPass<'encoder> { /// It is not affected by changes to the state that are performed after it is called. pub fn draw_indexed(&mut self, indices: Range, base_vertex: i32, instances: Range) { DynContext::render_pass_draw_indexed( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), indices, base_vertex, instances, @@ -4432,9 +4465,9 @@ impl<'encoder> RenderPass<'encoder> { /// See details on the individual flags for more information. pub fn draw_indirect(&mut self, indirect_buffer: &Buffer, indirect_offset: BufferAddress) { DynContext::render_pass_draw_indirect( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4461,9 +4494,9 @@ impl<'encoder> RenderPass<'encoder> { indirect_offset: BufferAddress, ) { DynContext::render_pass_draw_indexed_indirect( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4484,16 +4517,16 @@ impl<'encoder> RenderPass<'encoder> { .map(|rb| (&rb.id, rb.data.as_ref())); DynContext::render_pass_execute_bundles( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &mut render_bundles, ) } } /// [`Features::MULTI_DRAW_INDIRECT`] must be enabled on the device in order to call these functions. -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Dispatches multiple draw calls from the active vertex buffer(s) based on the contents of the `indirect_buffer`. /// `count` draw calls are issued. /// @@ -4511,9 +4544,9 @@ impl<'a> RenderPass<'a> { count: u32, ) { DynContext::render_pass_multi_draw_indirect( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4539,9 +4572,9 @@ impl<'a> RenderPass<'a> { count: u32, ) { DynContext::render_pass_multi_draw_indexed_indirect( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4583,9 +4616,9 @@ impl<'encoder> RenderPass<'encoder> { max_count: u32, ) { DynContext::render_pass_multi_draw_indirect_count( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4630,9 +4663,9 @@ impl<'encoder> RenderPass<'encoder> { max_count: u32, ) { DynContext::render_pass_multi_draw_indexed_indirect_count( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &indirect_buffer.id, indirect_buffer.data.as_ref(), indirect_offset, @@ -4688,9 +4721,9 @@ impl<'encoder> RenderPass<'encoder> { /// [`PushConstant`]: https://docs.rs/naga/latest/naga/enum.StorageClass.html#variant.PushConstant pub fn set_push_constants(&mut self, stages: ShaderStages, offset: u32, data: &[u8]) { DynContext::render_pass_set_push_constants( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), stages, offset, data, @@ -4709,9 +4742,9 @@ impl<'encoder> RenderPass<'encoder> { /// for a string of operations to complete. pub fn write_timestamp(&mut self, query_set: &QuerySet, query_index: u32) { DynContext::render_pass_write_timestamp( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &query_set.id, query_set.data.as_ref(), query_index, @@ -4719,14 +4752,14 @@ impl<'encoder> RenderPass<'encoder> { } } -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Start a occlusion query on this render pass. It can be ended with /// `end_occlusion_query`. Occlusion queries may not be nested. pub fn begin_occlusion_query(&mut self, query_index: u32) { DynContext::render_pass_begin_occlusion_query( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), query_index, ); } @@ -4735,22 +4768,22 @@ impl<'a> RenderPass<'a> { /// `begin_occlusion_query`. Occlusion queries may not be nested. pub fn end_occlusion_query(&mut self) { DynContext::render_pass_end_occlusion_query( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), ); } } /// [`Features::PIPELINE_STATISTICS_QUERY`] must be enabled on the device in order to call these functions. -impl<'a> RenderPass<'a> { +impl<'encoder> RenderPass<'encoder> { /// Start a pipeline statistics query on this render pass. It can be ended with /// `end_pipeline_statistics_query`. Pipeline statistics queries may not be nested. pub fn begin_pipeline_statistics_query(&mut self, query_set: &QuerySet, query_index: u32) { DynContext::render_pass_begin_pipeline_statistics_query( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), &query_set.id, query_set.data.as_ref(), query_index, @@ -4761,18 +4794,17 @@ impl<'a> RenderPass<'a> { /// `begin_pipeline_statistics_query`. Pipeline statistics queries may not be nested. pub fn end_pipeline_statistics_query(&mut self) { DynContext::render_pass_end_pipeline_statistics_query( - &*self.parent.context, - &mut self.id, - self.data.as_mut(), + &*self.inner.context, + &mut self.inner.id, + self.inner.data.as_mut(), ); } } -impl<'encoder> Drop for RenderPass<'encoder> { +impl Drop for RenderPassInner { fn drop(&mut self) { if !thread::panicking() { - self.parent - .context + self.context .render_pass_end(&mut self.id, self.data.as_mut()); } } From 5a467d34c893af8dfcd6ac1324017327ec4cc5a6 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 30 Jun 2024 14:29:31 +0200 Subject: [PATCH 14/15] Extend encoder_operations_fail_while_pass_alive test to also check encoder locking errors with render passes --- tests/tests/encoder.rs | 151 ++++++++++++++++++++++++++--------------- 1 file changed, 96 insertions(+), 55 deletions(-) diff --git a/tests/tests/encoder.rs b/tests/tests/encoder.rs index 22b0922ac8..337dffc2d0 100644 --- a/tests/tests/encoder.rs +++ b/tests/tests/encoder.rs @@ -77,18 +77,16 @@ static DROP_ENCODER_AFTER_ERROR: GpuTestConfiguration = GpuTestConfiguration::ne drop(encoder); }); -// TODO: This should also apply to render passes once the lifetime bound is lifted. #[gpu_test] -static ENCODER_OPERATIONS_FAIL_WHILE_COMPUTE_PASS_ALIVE: GpuTestConfiguration = - GpuTestConfiguration::new() - .parameters(TestParameters::default().features( - wgpu::Features::CLEAR_TEXTURE - | wgpu::Features::TIMESTAMP_QUERY - | wgpu::Features::TIMESTAMP_QUERY_INSIDE_ENCODERS, - )) - .run_sync(encoder_operations_fail_while_compute_pass_alive); +static ENCODER_OPERATIONS_FAIL_WHILE_PASS_ALIVE: GpuTestConfiguration = GpuTestConfiguration::new() + .parameters(TestParameters::default().features( + wgpu::Features::CLEAR_TEXTURE + | wgpu::Features::TIMESTAMP_QUERY + | wgpu::Features::TIMESTAMP_QUERY_INSIDE_ENCODERS, + )) + .run_sync(encoder_operations_fail_while_pass_alive); -fn encoder_operations_fail_while_compute_pass_alive(ctx: TestingContext) { +fn encoder_operations_fail_while_pass_alive(ctx: TestingContext) { let buffer_source = ctx .device .create_buffer_init(&wgpu::util::BufferInitDescriptor { @@ -129,6 +127,23 @@ fn encoder_operations_fail_while_compute_pass_alive(ctx: TestingContext) { label: None, }); + let target_desc = wgpu::TextureDescriptor { + label: Some("target_tex"), + size: wgpu::Extent3d { + width: 4, + height: 4, + depth_or_array_layers: 1, + }, + mip_level_count: 1, + sample_count: 1, + dimension: wgpu::TextureDimension::D2, + format: wgpu::TextureFormat::Bgra8UnormSrgb, + usage: wgpu::TextureUsages::RENDER_ATTACHMENT, + view_formats: &[wgpu::TextureFormat::Bgra8UnormSrgb], + }; + let target_tex = ctx.device.create_texture(&target_desc); + let color_attachment_view = target_tex.create_view(&wgpu::TextureViewDescriptor::default()); + #[allow(clippy::type_complexity)] let recording_ops: Vec<(_, Box)> = vec![ ( @@ -252,55 +267,81 @@ fn encoder_operations_fail_while_compute_pass_alive(ctx: TestingContext) { ), ]; - for (op_name, op) in recording_ops.iter() { - let mut encoder = ctx - .device - .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + #[derive(Clone, Copy, Debug)] + enum PassType { + Compute, + Render, + } - let pass = encoder - .begin_compute_pass(&wgpu::ComputePassDescriptor::default()) - .forget_lifetime(); + let create_pass = |encoder: &mut wgpu::CommandEncoder, pass_type| -> Box { + match pass_type { + PassType::Compute => Box::new( + encoder + .begin_compute_pass(&wgpu::ComputePassDescriptor::default()) + .forget_lifetime(), + ), + PassType::Render => Box::new( + encoder + .begin_render_pass(&wgpu::RenderPassDescriptor { + color_attachments: &[Some(wgpu::RenderPassColorAttachment { + view: &color_attachment_view, + resolve_target: None, + ops: wgpu::Operations::default(), + })], + ..Default::default() + }) + .forget_lifetime(), + ), + } + }; - ctx.device.push_error_scope(wgpu::ErrorFilter::Validation); + for &pass_type in [PassType::Compute, PassType::Render].iter() { + for (op_name, op) in recording_ops.iter() { + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); - log::info!("Testing operation {} on a locked command encoder", op_name); - fail( - &ctx.device, - || op(&mut encoder), - Some("Command encoder is locked"), - ); + let pass = create_pass(&mut encoder, pass_type); - // Drop the pass - this also fails now since the encoder is invalid: - fail( - &ctx.device, - || drop(pass), - Some("Command encoder is invalid"), - ); - // Also, it's not possible to create a new pass on the encoder: - fail( - &ctx.device, - || encoder.begin_compute_pass(&wgpu::ComputePassDescriptor::default()), - Some("Command encoder is invalid"), - ); - } + ctx.device.push_error_scope(wgpu::ErrorFilter::Validation); - // Test encoder finishing separately since it consumes the encoder and doesn't fit above pattern. - { - let mut encoder = ctx - .device - .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); - let pass = encoder - .begin_compute_pass(&wgpu::ComputePassDescriptor::default()) - .forget_lifetime(); - fail( - &ctx.device, - || encoder.finish(), - Some("Command encoder is locked"), - ); - fail( - &ctx.device, - || drop(pass), - Some("Command encoder is invalid"), - ); + log::info!("Testing operation {op_name:?} on a locked command encoder while a {pass_type:?} pass is active"); + fail( + &ctx.device, + || op(&mut encoder), + Some("Command encoder is locked"), + ); + + // Drop the pass - this also fails now since the encoder is invalid: + fail( + &ctx.device, + || drop(pass), + Some("Command encoder is invalid"), + ); + // Also, it's not possible to create a new pass on the encoder: + fail( + &ctx.device, + || encoder.begin_compute_pass(&wgpu::ComputePassDescriptor::default()), + Some("Command encoder is invalid"), + ); + } + + // Test encoder finishing separately since it consumes the encoder and doesn't fit above pattern. + { + let mut encoder = ctx + .device + .create_command_encoder(&wgpu::CommandEncoderDescriptor::default()); + let pass = create_pass(&mut encoder, pass_type); + fail( + &ctx.device, + || encoder.finish(), + Some("Command encoder is locked"), + ); + fail( + &ctx.device, + || drop(pass), + Some("Command encoder is invalid"), + ); + } } } From a463cddc9cb108203f39ec6b5fb16201ade83418 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Sun, 30 Jun 2024 14:53:56 +0200 Subject: [PATCH 15/15] improve changelog entry on lifetime bounds --- CHANGELOG.md | 30 ++++++++++++++++++++++-------- 1 file changed, 22 insertions(+), 8 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index a2ea1b8fa5..710fb2d6d5 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -41,24 +41,38 @@ Bottom level categories: ### Major Changes -#### Remove lifetime bounds on `wgpu::ComputePass` +#### Lifetime bounds on `wgpu::RenderPass` & `wgpu::ComputePass` -TODO(wumpf): This is still work in progress. Should write a bit more about it. Also will very likely extend to `wgpu::RenderPass` before release. +`wgpu::RenderPass` & `wgpu::ComputePass` recording methods (e.g. `wgpu::RenderPass:set_render_pipeline`) no longer impose a lifetime constraint to objects passed to a pass (like pipelines/buffers/bindgroups/query-sets etc.). + +This means the following pattern works now as expected: +```rust +let mut pipelines: Vec = ...; +// ... +let mut cpass = encoder.begin_compute_pass(&wgpu::ComputePassDescriptor::default()); +cpass.set_pipeline(&pipelines[123]); +// Change pipeline container - this requires mutable access to `pipelines` while one of the pipelines is in use. +pipelines.push(/* ... */); +// Continue pass recording. +cpass.set_bindgroup(...); +``` +Previously, a set pipeline (or other resource) had to outlive pass recording which often affected wider systems, +meaning that users needed to prove to the borrow checker that `Vec` (or similar constructs) +aren't accessed mutably for the duration of pass recording. -`wgpu::ComputePass` recording methods (e.g. `wgpu::ComputePass:set_render_pipeline`) no longer impose a lifetime constraint passed in resources. -Furthermore, you can now opt out of `wgpu::ComputePass`'s lifetime dependency on its parent `wgpu::CommandEncoder` using `wgpu::ComputePass::forget_lifetime`: +Furthermore, you can now opt out of `wgpu::RenderPass`/`wgpu::ComputePass`'s lifetime dependency on its parent `wgpu::CommandEncoder` using `wgpu::RenderPass::forget_lifetime`/`wgpu::ComputePass::forget_lifetime`: ```rust fn independent_cpass<'enc>(encoder: &'enc mut wgpu::CommandEncoder) -> wgpu::ComputePass<'static> { let cpass: wgpu::ComputePass<'enc> = encoder.begin_compute_pass(&wgpu::ComputePassDescriptor::default()); cpass.forget_lifetime() } ``` -⚠️ As long as a `wgpu::ComputePass` is pending for a given `wgpu::CommandEncoder`, creation of a compute or render pass is an error and invalidates the `wgpu::CommandEncoder`. -This is very useful for library authors, but opens up an easy way for incorrect use, so use with care. -`forget_lifetime` is zero overhead and has no side effects on pass recording. +⚠️ As long as a `wgpu::RenderPass`/`wgpu::ComputePass` is pending for a given `wgpu::CommandEncoder`, creation of a compute or render pass is an error and invalidates the `wgpu::CommandEncoder`. +`forget_lifetime` can be very useful for library authors, but opens up an easy way for incorrect use, so use with care. +This method doesn't add any additional overhead and has no side effects on pass recording. -By @wumpf in [#5569](https://github.com/gfx-rs/wgpu/pull/5569), [#5575](https://github.com/gfx-rs/wgpu/pull/5575), [#5620](https://github.com/gfx-rs/wgpu/pull/5620), [#5768](https://github.com/gfx-rs/wgpu/pull/5768) (together with @kpreid), [#5671](https://github.com/gfx-rs/wgpu/pull/5671). +By @wumpf in [#5569](https://github.com/gfx-rs/wgpu/pull/5569), [#5575](https://github.com/gfx-rs/wgpu/pull/5575), [#5620](https://github.com/gfx-rs/wgpu/pull/5620), [#5768](https://github.com/gfx-rs/wgpu/pull/5768) (together with @kpreid), [#5671](https://github.com/gfx-rs/wgpu/pull/5671), [#5794](https://github.com/gfx-rs/wgpu/pull/5794), [#5884](https://github.com/gfx-rs/wgpu/pull/5884). #### Querying shader compilation errors