// impeller/renderer/backend/vulkan/compute_pass_vk.cc - mirrors/engine - Git at Google

 // Copyright 2013 The Flutter Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "impeller/renderer/backend/vulkan/compute_pass_vk.h"

 #include "flutter/fml/trace_event.h"
 #include "impeller/renderer/backend/vulkan/command_buffer_vk.h"
 #include "impeller/renderer/backend/vulkan/compute_pipeline_vk.h"
 #include "impeller/renderer/backend/vulkan/sampler_vk.h"
 #include "impeller/renderer/backend/vulkan/texture_vk.h"

 namespace impeller {

 // Constructs a Vulkan compute pass.
 //
 // |context| is forwarded to the ComputePass base class. |command_buffer| is
 // kept as a weak reference; it is locked again when the pass encodes its
 // commands, so the pass does not keep the command buffer alive.
 ComputePassVK::ComputePassVK(std::weak_ptr<const Context> context,
                              std::weak_ptr<CommandBufferVK> command_buffer)
     : ComputePass(std::move(context)),
       command_buffer_(std::move(command_buffer)) {
   // Construction has no failure path, so the pass is marked valid
   // unconditionally.
   is_valid_ = true;
 }

 // Nothing to release explicitly; members clean up after themselves.
 ComputePassVK::~ComputePassVK() = default;

 // Reports the validity flag of this pass. The constructor sets the flag to
 // true; OnEncodeCommands refuses to encode when it is false.
 bool ComputePassVK::IsValid() const {
   return is_valid_;
 }

 // Remembers |label| so that encoding can wrap the pass in a debug group of
 // that name. Empty labels are ignored, which leaves any previously stored
 // label in place.
 void ComputePassVK::OnSetLabel(const std::string& label) {
   if (!label.empty()) {
     label_ = label;
   }
 }

 // Requests a layout change to eShaderReadOnlyOptimal for every sampled image
 // in |bindings|, using a barrier recorded on |buffer|.
 //
 // The barrier is described as transfer-write (transfer stage) to shader-read
 // (compute shader stage). Returns false as soon as one texture rejects the
 // layout change; returns true when there are no sampled images.
 static bool UpdateBindingLayouts(const Bindings& bindings,
                                  const vk::CommandBuffer& buffer) {
   BarrierVK layout_barrier;
   layout_barrier.cmd_buffer = buffer;
   layout_barrier.new_layout = vk::ImageLayout::eShaderReadOnlyOptimal;

   // Producer side of the dependency.
   layout_barrier.src_stage = vk::PipelineStageFlagBits::eTransfer;
   layout_barrier.src_access = vk::AccessFlagBits::eTransferWrite;

   // Consumer side of the dependency.
   layout_barrier.dst_stage = vk::PipelineStageFlagBits::eComputeShader;
   layout_barrier.dst_access = vk::AccessFlagBits::eShaderRead;

   for (const auto& entry : bindings.sampled_images) {
     auto& texture_vk = TextureVK::Cast(*entry.second.texture.resource);
     const bool layout_updated = texture_vk.SetLayout(layout_barrier);
     if (!layout_updated) {
       return false;
     }
   }
   return true;
 }

 // Convenience overload: updates the layouts of the resources bound by a
 // single compute command by forwarding its bindings to the Bindings overload.
 static bool UpdateBindingLayouts(const ComputeCommand& command,
                                  const vk::CommandBuffer& buffer) {
   const Bindings& command_bindings = command.bindings;
   return UpdateBindingLayouts(command_bindings, buffer);
 }

 // Updates the binding layouts of every command in |commands|, in order.
 // Stops at, and reports, the first failure; an empty list succeeds.
 static bool UpdateBindingLayouts(const std::vector<ComputeCommand>& commands,
                                  const vk::CommandBuffer& buffer) {
   for (const ComputeCommand& current : commands) {
     const bool updated = UpdateBindingLayouts(current, buffer);
     if (!updated) {
       return false;
     }
   }
   return true;
 }

 static bool AllocateAndBindDescriptorSets(const ContextVK& context,
                                           const ComputeCommand& command,
                                           CommandEncoderVK& encoder,
                                           const ComputePipelineVK& pipeline,
                                           size_t command_count) {
   auto desc_set = pipeline.GetDescriptor().GetDescriptorSetLayouts();
   auto vk_desc_set = encoder.AllocateDescriptorSet(
       pipeline.GetDescriptorSetLayout(), command_count);
   if (!vk_desc_set) {
     return false;
   }

   auto& allocator = *context.GetResourceAllocator();

   std::unordered_map<uint32_t, vk::DescriptorBufferInfo> buffers;
   std::unordered_map<uint32_t, vk::DescriptorImageInfo> images;
   std::vector<vk::WriteDescriptorSet> writes;
   auto bind_images = [&encoder,     //
                       &images,      //
                       &writes,      //
                       &vk_desc_set  //
   ](const Bindings& bindings) -> bool {
     for (const auto& [index, data] : bindings.sampled_images) {
       auto texture = data.texture.resource;
       const auto& texture_vk = TextureVK::Cast(*texture);
       const SamplerVK& sampler = SamplerVK::Cast(*data.sampler.resource);

       if (!encoder.Track(texture) ||
           !encoder.Track(sampler.GetSharedSampler())) {
         return false;
       }

       const SampledImageSlot& slot = data.slot;

       vk::DescriptorImageInfo image_info;
       image_info.imageLayout = vk::ImageLayout::eShaderReadOnlyOptimal;
       image_info.sampler = sampler.GetSampler();
       image_info.imageView = texture_vk.GetImageView();

       vk::WriteDescriptorSet write_set;
       write_set.dstSet = vk_desc_set.value();
       write_set.dstBinding = slot.binding;
       write_set.descriptorCount = 1u;
       write_set.descriptorType = vk::DescriptorType::eCombinedImageSampler;
       write_set.pImageInfo = &(images[slot.binding] = image_info);

       writes.push_back(write_set);
     }

     return true;
   };

   auto bind_buffers = [&allocator,   //
                        &encoder,     //
                        &buffers,     //
                        &writes,      //
                        &desc_set,    //
                        &vk_desc_set  //
   ](const Bindings& bindings) -> bool {
     for (const auto& [buffer_index, data] : bindings.buffers) {
       const auto& buffer_view = data.view.resource.buffer;

       auto device_buffer = buffer_view->GetDeviceBuffer(allocator);
       if (!device_buffer) {
         VALIDATION_LOG << "Failed to get device buffer for vertex binding";
         return false;
       }

       auto buffer = DeviceBufferVK::Cast(*device_buffer).GetBuffer();
       if (!buffer) {
         return false;
       }

       if (!encoder.Track(device_buffer)) {
         return false;
       }

       uint32_t offset = data.view.resource.range.offset;

       vk::DescriptorBufferInfo buffer_info;
       buffer_info.buffer = buffer;
       buffer_info.offset = offset;
       buffer_info.range = data.view.resource.range.length;

       const ShaderUniformSlot& uniform = data.slot;
       auto layout_it = std::find_if(desc_set.begin(), desc_set.end(),
                                     [&uniform](DescriptorSetLayout& layout) {
                                       return layout.binding == uniform.binding;
                                     });
       if (layout_it == desc_set.end()) {
         VALIDATION_LOG << "Failed to get descriptor set layout for binding "
                        << uniform.binding;
         return false;
       }
       auto layout = *layout_it;

       vk::WriteDescriptorSet write_set;
       write_set.dstSet = vk_desc_set.value();
       write_set.dstBinding = uniform.binding;
       write_set.descriptorCount = 1u;
       write_set.descriptorType = ToVKDescriptorType(layout.descriptor_type);
       write_set.pBufferInfo = &(buffers[uniform.binding] = buffer_info);

       writes.push_back(write_set);
     }
     return true;
   };

   if (!bind_buffers(command.bindings) || !bind_images(command.bindings)) {
     return false;
   }

   context.GetDevice().updateDescriptorSets(writes, {});

   encoder.GetCommandBuffer().bindDescriptorSets(
       vk::PipelineBindPoint::eCompute,    // bind point
       pipeline.GetPipelineLayout(),       // layout
       0,                                  // first set
       {vk::DescriptorSet{*vk_desc_set}},  // sets
       nullptr                             // offsets
   );
   return true;
 }

 // Encodes every recorded compute command into the command buffer this pass
 // was created with.
 //
 // |context|            must be a ContextVK; supplies the device and its
 //                      limits.
 // |grid_size|          the requested grid; determines the dispatch counts.
 // |thread_group_size|  only checked for emptiness in debug builds.
 //
 // Returns false when the pass is invalid, the command buffer has been
 // destroyed, no encoder is available, the image layouts cannot be updated, or
 // descriptor sets cannot be allocated and bound for a command. Commands
 // without a pipeline are skipped.
 bool ComputePassVK::OnEncodeCommands(const Context& context,
                                      const ISize& grid_size,
                                      const ISize& thread_group_size) const {
   TRACE_EVENT0("impeller", "ComputePassVK::EncodeCommands");
   if (!IsValid()) {
     return false;
   }

   FML_DCHECK(!grid_size.IsEmpty() && !thread_group_size.IsEmpty());

   const auto& vk_context = ContextVK::Cast(context);
   auto command_buffer = command_buffer_.lock();
   if (!command_buffer) {
     VALIDATION_LOG << "Command buffer died before commands could be encoded.";
     return false;
   }
   auto encoder = command_buffer->GetEncoder();
   if (!encoder) {
     return false;
   }

   // The debug group is popped on every exit path below, but only if one was
   // actually pushed; without a label the cleanup is disarmed.
   fml::ScopedCleanupClosure pop_marker(
       [&encoder]() { encoder->PopDebugGroup(); });
   if (!label_.empty()) {
     encoder->PushDebugGroup(label_.c_str());
   } else {
     pop_marker.Release();
   }
   auto cmd_buffer = encoder->GetCommandBuffer();

   if (!UpdateBindingLayouts(commands_, cmd_buffer)) {
     VALIDATION_LOG << "Could not update binding layouts for compute pass.";
     return false;
   }

   // TODO(dnfield): This should be moved to caps. But for now keeping this
   // in parallel with Metal.
   //
   // The device limits and the grid size are the same for every command, so
   // the dispatch dimensions are computed once instead of once per command.
   auto device_properties = vk_context.GetPhysicalDevice().getProperties();
   auto max_wg_size = device_properties.limits.maxComputeWorkGroupSize;
   const int64_t max_width = max_wg_size[0];
   const int64_t max_height = max_wg_size[1];

   int64_t width = grid_size.width;
   int64_t height = grid_size.height;

   // Special case for linear processing.
   if (height == 1) {
     // Integer ceil(width / max_width), clamped to at least one group.
     const int64_t minimum = 1;
     const int64_t thread_groups =
         width / max_width + (width % max_width != 0 ? 1 : 0);
     width = std::max(thread_groups, minimum);
   } else {
     // Halve each dimension until it fits within the device limit.
     while (width > max_width) {
       width = std::max(static_cast<int64_t>(1), width / 2);
     }
     while (height > max_height) {
       height = std::max(static_cast<int64_t>(1), height / 2);
     }
   }

   {
     TRACE_EVENT0("impeller", "EncodeComputePassCommands");

     for (const auto& command : commands_) {
       if (!command.pipeline) {
         continue;
       }

       const auto& pipeline_vk = ComputePipelineVK::Cast(*command.pipeline);

       cmd_buffer.bindPipeline(vk::PipelineBindPoint::eCompute,
                               pipeline_vk.GetPipeline());
       if (!AllocateAndBindDescriptorSets(vk_context,       //
                                          command,          //
                                          *encoder,         //
                                          pipeline_vk,      //
                                          commands_.size()  //
                                          )) {
         return false;
       }

       // In the linear case |height| is 1, so this is (groups, 1, 1).
       cmd_buffer.dispatch(static_cast<uint32_t>(width),
                           static_cast<uint32_t>(height), 1);
     }
   }

   return true;
 }

 }  // namespace impeller
	// Copyright 2013 The Flutter Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "impeller/renderer/backend/vulkan/compute_pass_vk.h"

	#include "flutter/fml/trace_event.h"
	#include "impeller/renderer/backend/vulkan/command_buffer_vk.h"
	#include "impeller/renderer/backend/vulkan/compute_pipeline_vk.h"
	#include "impeller/renderer/backend/vulkan/sampler_vk.h"
	#include "impeller/renderer/backend/vulkan/texture_vk.h"

	namespace impeller {

	// Constructs a Vulkan compute pass.
	//
	// |context| is forwarded to the ComputePass base class. |command_buffer| is
	// kept as a weak reference; it is locked again when the pass encodes its
	// commands, so the pass does not keep the command buffer alive.
	ComputePassVK::ComputePassVK(std::weak_ptr<const Context> context,
	std::weak_ptr<CommandBufferVK> command_buffer)
	: ComputePass(std::move(context)),
	command_buffer_(std::move(command_buffer)) {
	// Construction has no failure path, so the pass is marked valid
	// unconditionally.
	is_valid_ = true;
	}

	// Nothing to release explicitly; members clean up after themselves.
	ComputePassVK::~ComputePassVK() = default;

	// Reports the validity flag of this pass. The constructor sets the flag to
	// true; OnEncodeCommands refuses to encode when it is false.
	bool ComputePassVK::IsValid() const {
	return is_valid_;
	}

	// Remembers |label| so that encoding can wrap the pass in a debug group of
	// that name. Empty labels are ignored, which leaves any previously stored
	// label in place.
	void ComputePassVK::OnSetLabel(const std::string& label) {
	  if (!label.empty()) {
	    label_ = label;
	  }
	}

	// Requests a layout change to eShaderReadOnlyOptimal for every sampled image
	// in |bindings|, using a barrier recorded on |buffer|.
	//
	// The barrier is described as transfer-write (transfer stage) to shader-read
	// (compute shader stage). Returns false as soon as one texture rejects the
	// layout change; returns true when there are no sampled images.
	static bool UpdateBindingLayouts(const Bindings& bindings,
	                                 const vk::CommandBuffer& buffer) {
	  BarrierVK layout_barrier;
	  layout_barrier.cmd_buffer = buffer;
	  layout_barrier.new_layout = vk::ImageLayout::eShaderReadOnlyOptimal;

	  // Producer side of the dependency.
	  layout_barrier.src_stage = vk::PipelineStageFlagBits::eTransfer;
	  layout_barrier.src_access = vk::AccessFlagBits::eTransferWrite;

	  // Consumer side of the dependency.
	  layout_barrier.dst_stage = vk::PipelineStageFlagBits::eComputeShader;
	  layout_barrier.dst_access = vk::AccessFlagBits::eShaderRead;

	  for (const auto& entry : bindings.sampled_images) {
	    auto& texture_vk = TextureVK::Cast(*entry.second.texture.resource);
	    const bool layout_updated = texture_vk.SetLayout(layout_barrier);
	    if (!layout_updated) {
	      return false;
	    }
	  }
	  return true;
	}

	// Convenience overload: updates the layouts of the resources bound by a
	// single compute command by forwarding its bindings to the Bindings overload.
	static bool UpdateBindingLayouts(const ComputeCommand& command,
	                                 const vk::CommandBuffer& buffer) {
	  const Bindings& command_bindings = command.bindings;
	  return UpdateBindingLayouts(command_bindings, buffer);
	}

	// Updates the binding layouts of every command in |commands|, in order.
	// Stops at, and reports, the first failure; an empty list succeeds.
	static bool UpdateBindingLayouts(const std::vector<ComputeCommand>& commands,
	                                 const vk::CommandBuffer& buffer) {
	  for (const ComputeCommand& current : commands) {
	    const bool updated = UpdateBindingLayouts(current, buffer);
	    if (!updated) {
	      return false;
	    }
	  }
	  return true;
	}

	static bool AllocateAndBindDescriptorSets(const ContextVK& context,
	const ComputeCommand& command,
	CommandEncoderVK& encoder,
	const ComputePipelineVK& pipeline,
	size_t command_count) {
	auto desc_set = pipeline.GetDescriptor().GetDescriptorSetLayouts();
	auto vk_desc_set = encoder.AllocateDescriptorSet(
	pipeline.GetDescriptorSetLayout(), command_count);
	if (!vk_desc_set) {
	return false;
	}

	auto& allocator = *context.GetResourceAllocator();

	std::unordered_map<uint32_t, vk::DescriptorBufferInfo> buffers;
	std::unordered_map<uint32_t, vk::DescriptorImageInfo> images;
	std::vector<vk::WriteDescriptorSet> writes;
	auto bind_images = [&encoder, //
	&images, //
	&writes, //
	&vk_desc_set //
	](const Bindings& bindings) -> bool {
	for (const auto& [index, data] : bindings.sampled_images) {
	auto texture = data.texture.resource;
	const auto& texture_vk = TextureVK::Cast(*texture);
	const SamplerVK& sampler = SamplerVK::Cast(*data.sampler.resource);

	if (!encoder.Track(texture) \|\|
	!encoder.Track(sampler.GetSharedSampler())) {
	return false;
	}

	const SampledImageSlot& slot = data.slot;

	vk::DescriptorImageInfo image_info;
	image_info.imageLayout = vk::ImageLayout::eShaderReadOnlyOptimal;
	image_info.sampler = sampler.GetSampler();
	image_info.imageView = texture_vk.GetImageView();

	vk::WriteDescriptorSet write_set;
	write_set.dstSet = vk_desc_set.value();
	write_set.dstBinding = slot.binding;
	write_set.descriptorCount = 1u;
	write_set.descriptorType = vk::DescriptorType::eCombinedImageSampler;
	write_set.pImageInfo = &(images[slot.binding] = image_info);

	writes.push_back(write_set);
	}

	return true;
	};

	auto bind_buffers = [&allocator, //
	&encoder, //
	&buffers, //
	&writes, //
	&desc_set, //
	&vk_desc_set //
	](const Bindings& bindings) -> bool {
	for (const auto& [buffer_index, data] : bindings.buffers) {
	const auto& buffer_view = data.view.resource.buffer;

	auto device_buffer = buffer_view->GetDeviceBuffer(allocator);
	if (!device_buffer) {
	VALIDATION_LOG << "Failed to get device buffer for vertex binding";
	return false;
	}

	auto buffer = DeviceBufferVK::Cast(*device_buffer).GetBuffer();
	if (!buffer) {
	return false;
	}

	if (!encoder.Track(device_buffer)) {
	return false;
	}

	uint32_t offset = data.view.resource.range.offset;

	vk::DescriptorBufferInfo buffer_info;
	buffer_info.buffer = buffer;
	buffer_info.offset = offset;
	buffer_info.range = data.view.resource.range.length;

	const ShaderUniformSlot& uniform = data.slot;
	auto layout_it = std::find_if(desc_set.begin(), desc_set.end(),
	[&uniform](DescriptorSetLayout& layout) {
	return layout.binding == uniform.binding;
	});
	if (layout_it == desc_set.end()) {
	VALIDATION_LOG << "Failed to get descriptor set layout for binding "
	<< uniform.binding;
	return false;
	}
	auto layout = *layout_it;

	vk::WriteDescriptorSet write_set;
	write_set.dstSet = vk_desc_set.value();
	write_set.dstBinding = uniform.binding;
	write_set.descriptorCount = 1u;
	write_set.descriptorType = ToVKDescriptorType(layout.descriptor_type);
	write_set.pBufferInfo = &(buffers[uniform.binding] = buffer_info);

	writes.push_back(write_set);
	}
	return true;
	};

	if (!bind_buffers(command.bindings) \|\| !bind_images(command.bindings)) {
	return false;
	}

	context.GetDevice().updateDescriptorSets(writes, {});

	encoder.GetCommandBuffer().bindDescriptorSets(
	vk::PipelineBindPoint::eCompute, // bind point
	pipeline.GetPipelineLayout(), // layout
	0, // first set
	{vk::DescriptorSet{*vk_desc_set}}, // sets
	nullptr // offsets
	);
	return true;
	}

	// Encodes every recorded compute command into the command buffer this pass
	// was created with.
	//
	// |context|            must be a ContextVK; supplies the device and its
	//                      limits.
	// |grid_size|          the requested grid; determines the dispatch counts.
	// |thread_group_size|  only checked for emptiness in debug builds.
	//
	// Returns false when the pass is invalid, the command buffer has been
	// destroyed, no encoder is available, the image layouts cannot be updated, or
	// descriptor sets cannot be allocated and bound for a command. Commands
	// without a pipeline are skipped.
	bool ComputePassVK::OnEncodeCommands(const Context& context,
	                                     const ISize& grid_size,
	                                     const ISize& thread_group_size) const {
	  TRACE_EVENT0("impeller", "ComputePassVK::EncodeCommands");
	  if (!IsValid()) {
	    return false;
	  }

	  FML_DCHECK(!grid_size.IsEmpty() && !thread_group_size.IsEmpty());

	  const auto& vk_context = ContextVK::Cast(context);
	  auto command_buffer = command_buffer_.lock();
	  if (!command_buffer) {
	    VALIDATION_LOG << "Command buffer died before commands could be encoded.";
	    return false;
	  }
	  auto encoder = command_buffer->GetEncoder();
	  if (!encoder) {
	    return false;
	  }

	  // The debug group is popped on every exit path below, but only if one was
	  // actually pushed; without a label the cleanup is disarmed.
	  fml::ScopedCleanupClosure pop_marker(
	      [&encoder]() { encoder->PopDebugGroup(); });
	  if (!label_.empty()) {
	    encoder->PushDebugGroup(label_.c_str());
	  } else {
	    pop_marker.Release();
	  }
	  auto cmd_buffer = encoder->GetCommandBuffer();

	  if (!UpdateBindingLayouts(commands_, cmd_buffer)) {
	    VALIDATION_LOG << "Could not update binding layouts for compute pass.";
	    return false;
	  }

	  // TODO(dnfield): This should be moved to caps. But for now keeping this
	  // in parallel with Metal.
	  //
	  // The device limits and the grid size are the same for every command, so
	  // the dispatch dimensions are computed once instead of once per command.
	  auto device_properties = vk_context.GetPhysicalDevice().getProperties();
	  auto max_wg_size = device_properties.limits.maxComputeWorkGroupSize;
	  const int64_t max_width = max_wg_size[0];
	  const int64_t max_height = max_wg_size[1];

	  int64_t width = grid_size.width;
	  int64_t height = grid_size.height;

	  // Special case for linear processing.
	  if (height == 1) {
	    // Integer ceil(width / max_width), clamped to at least one group.
	    const int64_t minimum = 1;
	    const int64_t thread_groups =
	        width / max_width + (width % max_width != 0 ? 1 : 0);
	    width = std::max(thread_groups, minimum);
	  } else {
	    // Halve each dimension until it fits within the device limit.
	    while (width > max_width) {
	      width = std::max(static_cast<int64_t>(1), width / 2);
	    }
	    while (height > max_height) {
	      height = std::max(static_cast<int64_t>(1), height / 2);
	    }
	  }

	  {
	    TRACE_EVENT0("impeller", "EncodeComputePassCommands");

	    for (const auto& command : commands_) {
	      if (!command.pipeline) {
	        continue;
	      }

	      const auto& pipeline_vk = ComputePipelineVK::Cast(*command.pipeline);

	      cmd_buffer.bindPipeline(vk::PipelineBindPoint::eCompute,
	                              pipeline_vk.GetPipeline());
	      if (!AllocateAndBindDescriptorSets(vk_context,       //
	                                         command,          //
	                                         *encoder,         //
	                                         pipeline_vk,      //
	                                         commands_.size()  //
	                                         )) {
	        return false;
	      }

	      // In the linear case |height| is 1, so this is (groups, 1, 1).
	      cmd_buffer.dispatch(static_cast<uint32_t>(width),
	                          static_cast<uint32_t>(height), 1);
	    }
	  }

	  return true;
	}

	} // namespace impeller