// Copyright 2017 The Dawn & Tint Authors
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice, this
// list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// 3. Neither the name of the copyright holder nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#include "dawn/native/metal/ComputePipelineMTL.h"
#include "dawn/common/Math.h"
#include "dawn/native/Adapter.h"
#include "dawn/native/CreatePipelineAsyncTask.h"
#include "dawn/native/Instance.h"
#include "dawn/native/metal/BackendMTL.h"
#include "dawn/native/metal/DeviceMTL.h"
#include "dawn/native/metal/ShaderModuleMTL.h"
#include "dawn/native/metal/UtilsMetal.h"
#include "dawn/platform/metrics/HistogramMacros.h"
namespace dawn::native::metal {
// static
Ref<ComputePipeline> ComputePipeline::CreateUninitialized(
    Device* device,
    const UnpackedPtr<ComputePipelineDescriptor>& descriptor) {
    return AcquireRef(new ComputePipeline(device, descriptor));
}

ComputePipeline::ComputePipeline(DeviceBase* dev,
                                 const UnpackedPtr<ComputePipelineDescriptor>& desc)
    : ComputePipelineBase(dev, desc) {}

ComputePipeline::~ComputePipeline() = default;

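// Synchronously builds the pipeline: Tint translates the WGSL compute entry point into an MSL
// function, and a MTLComputePipelineState is then created from it on the Metal device.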
MaybeError ComputePipeline::InitializeImpl() {
    auto mtlDevice = ToBackend(GetDevice())->GetMTLDevice();

    const ProgrammableStage& computeStage = GetStage(SingleShaderStage::Compute);
    ShaderModule::MetalFunctionData computeData;
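    // Generate the MSL function for the compute entry point. The sampleMask and renderPipeline
    // parameters only apply to render pipelines, so don't-care values are passed for them here.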
    DAWN_TRY(ToBackend(computeStage.module.Get())
                 ->CreateFunction(
                     SingleShaderStage::Compute, computeStage, ToBackend(GetLayout()),
                     &computeData,
                     /* sampleMask */ 0xFFFFFFFF,
                     /* renderPipeline */ nullptr,
                     /* maxSubgroupSizeForFullSubgroups */
                     IsFullSubgroupsRequired()
                         ? std::make_optional(
                               GetDevice()->GetLimits().experimentalSubgroupLimits.maxSubgroupSize)
                         : std::nullopt));

    NSError* error = nullptr;

    NSRef<NSString> label = MakeDebugName(GetDevice(), "Dawn_ComputePipeline", GetLabel());
    NSRef<MTLComputePipelineDescriptor> descriptorRef =
        AcquireNSRef([MTLComputePipelineDescriptor new]);
    MTLComputePipelineDescriptor* descriptor = descriptorRef.Get();
    descriptor.computeFunction = computeData.function.Get();
    descriptor.label = label.Get();
    if (IsFullSubgroupsRequired()) {
        descriptor.threadGroupSizeIsMultipleOfThreadExecutionWidth = true;
    }

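    // Time the driver-side compile. The sample is recorded below only on success, so it
    // measures the cost of an actual pipeline build (the histogram is named for a cache miss).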
    platform::metrics::DawnHistogramTimer timer(GetDevice()->GetPlatform());
    mMtlComputePipelineState.Acquire([mtlDevice
        newComputePipelineStateWithDescriptor:descriptor
                                      options:MTLPipelineOptionNone
                                   reflection:nil
                                        error:&error]);
    if (error != nullptr) {
        return DAWN_INTERNAL_ERROR("Error creating pipeline state " +
                                   std::string([error.localizedDescription UTF8String]));
    }
    DAWN_ASSERT(mMtlComputePipelineState != nil);
    timer.RecordMicroseconds("Metal.newComputePipelineStateWithDescriptor.CacheMiss");

    // Copy over the local workgroup size: Metal does not bake the workgroup size into the
    // pipeline state, so it must be passed explicitly as threadsPerThreadgroup at dispatch time.
    mLocalWorkgroupSize = computeData.localWorkgroupSize;

    mRequiresStorageBufferLength = computeData.needsStorageBufferLength;
    mWorkgroupAllocations = std::move(computeData.workgroupAllocations);
    return {};
}

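// Binds this pipeline on the given compute command encoder and reserves the threadgroup
// ("workgroup" in WGSL) memory that the Tint-generated MSL expects at each buffer index.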
void ComputePipeline::Encode(id<MTLComputeCommandEncoder> encoder) {
    [encoder setComputePipelineState:mMtlComputePipelineState.Get()];
    for (size_t i = 0; i < mWorkgroupAllocations.size(); ++i) {
        if (mWorkgroupAllocations[i] == 0) {
            continue;
        }
        // Metal requires the threadgroup memory length to be a multiple of 16 bytes.
        uint32_t rounded = Align<uint32_t>(mWorkgroupAllocations[i], 16);
        [encoder setThreadgroupMemoryLength:rounded atIndex:i];
    }
}

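// Returns the entry point's workgroup size, which the caller passes as threadsPerThreadgroup
// when dispatching. A minimal sketch of how the two methods pair up at command-recording time
// (the encoder and group counts here are placeholders, not Dawn's actual call site):
//
//   pipeline->Encode(mtlEncoder);
//   [mtlEncoder dispatchThreadgroups:MTLSizeMake(groupsX, groupsY, groupsZ)
//              threadsPerThreadgroup:pipeline->GetLocalWorkGroupSize()];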
MTLSize ComputePipeline::GetLocalWorkGroupSize() const {
    return mLocalWorkgroupSize;
}

bool ComputePipeline::RequiresStorageBufferLength() const {
    return mRequiresStorageBufferLength;
}

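// Kicks off pipeline initialization on a separate task, except on configurations where doing
// so is known to crash (see the workaround below), in which case it runs synchronously.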
void ComputePipeline::InitializeAsync(Ref<ComputePipelineBase> computePipeline,
                                      WGPUCreateComputePipelineAsyncCallback callback,
                                      void* userdata) {
    PhysicalDeviceBase* physicalDevice = computePipeline->GetDevice()->GetPhysicalDevice();
    std::unique_ptr<CreateComputePipelineAsyncTask> asyncTask =
        std::make_unique<CreateComputePipelineAsyncTask>(std::move(computePipeline), callback,
                                                         userdata);

    // Workaround for a crash with PartitionAlloc when the Metal validation layers are enabled
    // on AMD GPUs: run the creation task synchronously instead of on a separate thread.
    // See crbug.com/dawn/1200.
    if (IsMetalValidationEnabled(physicalDevice) &&
        gpu_info::IsAMD(physicalDevice->GetVendorId())) {
        asyncTask->Run();
        return;
    }

    CreateComputePipelineAsyncTask::RunAsync(std::move(asyncTask));
}

} // namespace dawn::native::metal