From 04ac773bc61fa636594dc4224323fbf15729b697 Mon Sep 17 00:00:00 2001 From: Connor Fitzgerald Date: Sun, 16 Aug 2020 20:27:37 -0400 Subject: [PATCH] [rs] Convert StagingBelt to take a &mut CommandEncoder --- wgpu/examples/skybox/main.rs | 13 +++++++----- wgpu/src/util/belt.rs | 39 ++++++++++++++++++------------------ 2 files changed, 27 insertions(+), 25 deletions(-) diff --git a/wgpu/examples/skybox/main.rs b/wgpu/examples/skybox/main.rs index 454b48c2e6..858de6ed85 100644 --- a/wgpu/examples/skybox/main.rs +++ b/wgpu/examples/skybox/main.rs @@ -277,7 +277,7 @@ impl framework::Example for Skybox { uniform_buf, aspect, uniforms, - staging_belt: wgpu::util::StagingBelt::new(0x100, device), + staging_belt: wgpu::util::StagingBelt::new(0x100), } } @@ -305,22 +305,25 @@ impl framework::Example for Skybox { queue: &wgpu::Queue, spawner: &impl LocalSpawn, ) { + let mut encoder = + device.create_command_encoder(&wgpu::CommandEncoderDescriptor { label: None }); + // update rotation let rotation = cgmath::Matrix4::::from_angle_x(cgmath::Deg(0.25)); self.uniforms[1] = self.uniforms[1] * rotation; let raw_uniforms = raw_uniforms(&self.uniforms); self.staging_belt .write_buffer( + &mut encoder, &self.uniform_buf, 0, wgpu::BufferSize::new((raw_uniforms.len() * 4) as wgpu::BufferAddress).unwrap(), device, ) .copy_from_slice(bytemuck::cast_slice(&raw_uniforms)); - let transfer_comb = self.staging_belt.flush(device); - let mut encoder = - device.create_command_encoder(&wgpu::CommandEncoderDescriptor { label: None }); + self.staging_belt.finish(); + { let mut rpass = encoder.begin_render_pass(&wgpu::RenderPassDescriptor { color_attachments: &[wgpu::RenderPassColorAttachmentDescriptor { @@ -344,7 +347,7 @@ impl framework::Example for Skybox { rpass.draw(0..3 as u32, 0..1); } - queue.submit(vec![transfer_comb, encoder.finish()]); + queue.submit(std::iter::once(encoder.finish())); let belt_future = self.staging_belt.recall(); spawner.spawn_local(belt_future).unwrap(); diff --git 
a/wgpu/src/util/belt.rs b/wgpu/src/util/belt.rs index 6d780785cd..7c4662406d 100644 --- a/wgpu/src/util/belt.rs +++ b/wgpu/src/util/belt.rs @@ -1,9 +1,9 @@ use crate::{ - Buffer, BufferAddress, BufferDescriptor, BufferSize, BufferUsage, BufferViewMut, CommandBuffer, - CommandEncoder, CommandEncoderDescriptor, Device, MapMode, + Buffer, BufferAddress, BufferDescriptor, BufferSize, BufferUsage, BufferViewMut, + CommandEncoder, Device, MapMode, }; use futures::{future::join_all, FutureExt}; -use std::{future::Future, mem, sync::mpsc}; +use std::{future::Future, sync::mpsc}; struct Chunk { buffer: Buffer, @@ -16,9 +16,14 @@ struct Chunk { /// Internally it uses a ring-buffer of staging buffers that are sub-allocated. /// It has an advantage over `Queue.write_buffer` in a way that it returns a mutable slice, /// which you can fill to avoid an extra data copy. +/// +/// Using a staging belt is slightly complicated, and generally goes as follows: +/// - Write to buffers that need writing to using `write_buffer`. +/// - Call `finish`. +/// - Submit all command encoders used with `write_buffer`. +/// - Call `recall` pub struct StagingBelt { chunk_size: BufferAddress, - encoder: CommandEncoder, /// Chunks that we are actively using for pending transfers at this moment. active_chunks: Vec, /// Chunks that have scheduled transfers already. @@ -35,11 +40,10 @@ impl StagingBelt { /// The `chunk_size` is the unit of internal buffer allocation. /// It's better when it's big, but ideally still 1-4 times less than /// the total amount of data uploaded per submission. 
- pub fn new(chunk_size: BufferAddress, device: &Device) -> Self { + pub fn new(chunk_size: BufferAddress) -> Self { let (sender, receiver) = mpsc::channel(); StagingBelt { chunk_size, - encoder: device.create_command_encoder(&CommandEncoderDescriptor::default()), active_chunks: Vec::new(), closed_chunks: Vec::new(), free_chunks: Vec::new(), @@ -51,9 +55,11 @@ impl StagingBelt { /// Allocate the staging belt slice of `size` to be uploaded into the `target` buffer /// at the specified offset. /// - /// The upload will only really be scheduled at the next `StagingBelt::flush` call. + /// The upload will be placed into the provided command encoder. This encoder + /// must be submitted after `finish` is called and before `recall` is called. pub fn write_buffer( &mut self, + encoder: &mut CommandEncoder, target: &Buffer, offset: BufferAddress, size: BufferSize, @@ -87,8 +93,7 @@ impl StagingBelt { } }; - self.encoder - .copy_buffer_to_buffer(&chunk.buffer, chunk.offset, target, offset, size.get()); + encoder.copy_buffer_to_buffer(&chunk.buffer, chunk.offset, target, offset, size.get()); let old_offset = chunk.offset; chunk.offset += size.get(); let remainder = chunk.offset % crate::COPY_BUFFER_ALIGNMENT; @@ -105,29 +110,23 @@ impl StagingBelt { .get_mapped_range_mut() } - /// Produce a command buffer with all the accumulated transfers. + /// Prepare currently mapped buffers for use in a submission. /// /// At this point, all the partially used staging buffers are closed until /// the GPU is done copying the data from them. - pub fn flush(&mut self, device: &Device) -> CommandBuffer { + pub fn finish(&mut self) { #[cfg(not(target_arch = "wasm32"))] - wgc::span!(_guard, DEBUG, "Flushing chunks"); + wgc::span!(_guard, DEBUG, "Finishing chunks"); for chunk in self.active_chunks.drain(..) 
{ chunk.buffer.unmap(); self.closed_chunks.push(chunk); } - - mem::replace( - &mut self.encoder, - device.create_command_encoder(&CommandEncoderDescriptor::default()), - ) - .finish() } - /// Recall all of the closed buffers back for re-usal. + /// Recall all of the closed buffers back to be reused. /// - /// This has to be called after the command buffer produced by `flush` is submitted! + /// This has to be called after the command encoders passed to `write_buffer` are submitted! pub fn recall(&mut self) -> impl Future + Send { while let Ok(mut chunk) = self.receiver.try_recv() { chunk.offset = 0;