blob: a414f7aecf38cb5ef99b7e9b922511c891f00c06 [file] [log] [blame]
// Copyright 2023 The Dawn & Tint Authors
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice, this
// list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// 3. Neither the name of the copyright holder nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#include "src/tint/lang/spirv/writer/raise/builtin_polyfill.h"
#include <utility>
#include "spirv/unified1/spirv.h"
#include "src/tint/lang/core/fluent_types.h"
#include "src/tint/lang/core/ir/builder.h"
#include "src/tint/lang/core/ir/module.h"
#include "src/tint/lang/core/ir/validator.h"
#include "src/tint/lang/core/type/builtin_structs.h"
#include "src/tint/lang/core/type/depth_multisampled_texture.h"
#include "src/tint/lang/core/type/depth_texture.h"
#include "src/tint/lang/core/type/input_attachment.h"
#include "src/tint/lang/core/type/multisampled_texture.h"
#include "src/tint/lang/core/type/sampled_texture.h"
#include "src/tint/lang/core/type/storage_texture.h"
#include "src/tint/lang/core/type/texture.h"
#include "src/tint/lang/spirv/ir/builtin_call.h"
#include "src/tint/lang/spirv/ir/literal_operand.h"
#include "src/tint/lang/spirv/type/sampled_image.h"
#include "src/tint/utils/ice/ice.h"
using namespace tint::core::number_suffixes; // NOLINT
using namespace tint::core::fluent_types; // NOLINT
namespace tint::spirv::writer::raise {
namespace {
/// PIMPL state for the transform.
struct State {
/// The IR module.
core::ir::Module& ir;
/// If we should use the vulkan memory model
bool use_vulkan_memory_model = false;
/// The IR builder.
core::ir::Builder b{ir};
/// The type manager.
core::type::Manager& ty{ir.Types()};
/// Process the module.
void Process() {
// Find the builtins that need replacing.
Vector<core::ir::CoreBuiltinCall*, 4> worklist;
for (auto* inst : ir.Instructions()) {
if (auto* builtin = inst->As<core::ir::CoreBuiltinCall>()) {
switch (builtin->Func()) {
case core::BuiltinFn::kArrayLength:
case core::BuiltinFn::kAtomicAdd:
case core::BuiltinFn::kAtomicAnd:
case core::BuiltinFn::kAtomicCompareExchangeWeak:
case core::BuiltinFn::kAtomicExchange:
case core::BuiltinFn::kAtomicLoad:
case core::BuiltinFn::kAtomicMax:
case core::BuiltinFn::kAtomicMin:
case core::BuiltinFn::kAtomicOr:
case core::BuiltinFn::kAtomicStore:
case core::BuiltinFn::kAtomicSub:
case core::BuiltinFn::kAtomicXor:
case core::BuiltinFn::kDot:
case core::BuiltinFn::kDot4I8Packed:
case core::BuiltinFn::kDot4U8Packed:
case core::BuiltinFn::kQuadBroadcast:
case core::BuiltinFn::kSelect:
case core::BuiltinFn::kSubgroupBroadcast:
case core::BuiltinFn::kSubgroupShuffle:
case core::BuiltinFn::kTextureDimensions:
case core::BuiltinFn::kTextureGather:
case core::BuiltinFn::kTextureGatherCompare:
case core::BuiltinFn::kTextureLoad:
case core::BuiltinFn::kTextureNumLayers:
case core::BuiltinFn::kTextureSample:
case core::BuiltinFn::kTextureSampleBias:
case core::BuiltinFn::kTextureSampleCompare:
case core::BuiltinFn::kTextureSampleCompareLevel:
case core::BuiltinFn::kTextureSampleGrad:
case core::BuiltinFn::kTextureSampleLevel:
case core::BuiltinFn::kTextureStore:
case core::BuiltinFn::kInputAttachmentLoad:
worklist.Push(builtin);
break;
case core::BuiltinFn::kQuantizeToF16:
if (builtin->Result(0)->Type()->Is<core::type::Vector>()) {
worklist.Push(builtin);
}
break;
default:
break;
}
}
}
// Replace the builtins that we found.
for (auto* builtin : worklist) {
switch (builtin->Func()) {
case core::BuiltinFn::kArrayLength:
ArrayLength(builtin);
break;
case core::BuiltinFn::kAtomicAdd:
case core::BuiltinFn::kAtomicAnd:
case core::BuiltinFn::kAtomicCompareExchangeWeak:
case core::BuiltinFn::kAtomicExchange:
case core::BuiltinFn::kAtomicLoad:
case core::BuiltinFn::kAtomicMax:
case core::BuiltinFn::kAtomicMin:
case core::BuiltinFn::kAtomicOr:
case core::BuiltinFn::kAtomicStore:
case core::BuiltinFn::kAtomicSub:
case core::BuiltinFn::kAtomicXor:
Atomic(builtin);
break;
case core::BuiltinFn::kDot:
Dot(builtin);
break;
case core::BuiltinFn::kDot4I8Packed:
case core::BuiltinFn::kDot4U8Packed:
DotPacked4x8(builtin);
break;
case core::BuiltinFn::kQuadBroadcast:
QuadBroadcast(builtin);
break;
case core::BuiltinFn::kSelect:
Select(builtin);
break;
case core::BuiltinFn::kSubgroupBroadcast:
SubgroupBroadcast(builtin);
break;
case core::BuiltinFn::kSubgroupShuffle:
SubgroupShuffle(builtin);
break;
case core::BuiltinFn::kTextureDimensions:
TextureDimensions(builtin);
break;
case core::BuiltinFn::kTextureGather:
case core::BuiltinFn::kTextureGatherCompare:
TextureGather(builtin);
break;
case core::BuiltinFn::kTextureLoad:
TextureLoad(builtin);
break;
case core::BuiltinFn::kTextureNumLayers:
TextureNumLayers(builtin);
break;
case core::BuiltinFn::kTextureSample:
case core::BuiltinFn::kTextureSampleBias:
case core::BuiltinFn::kTextureSampleCompare:
case core::BuiltinFn::kTextureSampleCompareLevel:
case core::BuiltinFn::kTextureSampleGrad:
case core::BuiltinFn::kTextureSampleLevel:
TextureSample(builtin);
break;
case core::BuiltinFn::kTextureStore:
TextureStore(builtin);
break;
case core::BuiltinFn::kQuantizeToF16:
QuantizeToF16Vec(builtin);
break;
case core::BuiltinFn::kInputAttachmentLoad:
InputAttachmentLoad(builtin);
break;
default:
break;
}
}
}
/// Create a literal operand.
/// @param value the literal value
/// @returns the literal operand
spirv::ir::LiteralOperand* Literal(u32 value) {
return ir.CreateValue<spirv::ir::LiteralOperand>(b.ConstantValue(value));
}
/// Handle an `arrayLength()` builtin.
/// @param builtin the builtin call instruction
void ArrayLength(core::ir::CoreBuiltinCall* builtin) {
// Strip away any let instructions to get to the original struct member access instruction.
auto* ptr = builtin->Args()[0]->As<core::ir::InstructionResult>();
while (auto* let = tint::As<core::ir::Let>(ptr->Instruction())) {
ptr = let->Value()->As<core::ir::InstructionResult>();
}
TINT_ASSERT(ptr);
auto* access = ptr->Instruction()->As<core::ir::Access>();
TINT_ASSERT(access);
TINT_ASSERT(access->Indices().Length() == 1u);
TINT_ASSERT(access->Object()->Type()->UnwrapPtr()->Is<core::type::Struct>());
auto* const_idx = access->Indices()[0]->As<core::ir::Constant>();
// Replace the builtin call with a call to the spirv.array_length intrinsic.
auto* call = b.CallWithResult<spirv::ir::BuiltinCall>(
builtin->DetachResult(), spirv::BuiltinFn::kArrayLength,
Vector{access->Object(), Literal(u32(const_idx->Value()->ValueAs<uint32_t>()))});
call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle an atomic*() builtin.
/// @param builtin the builtin call instruction
void Atomic(core::ir::CoreBuiltinCall* builtin) {
auto* result_ty = builtin->Result(0)->Type();
auto* pointer = builtin->Args()[0];
auto* memory = [&]() -> core::ir::Value* {
switch (pointer->Type()->As<core::type::Pointer>()->AddressSpace()) {
case core::AddressSpace::kWorkgroup:
return b.Constant(u32(SpvScopeWorkgroup));
case core::AddressSpace::kStorage:
return b.Constant(u32(SpvScopeDevice));
default:
TINT_UNREACHABLE() << "unhandled atomic address space";
}
}();
auto* memory_semantics = b.Constant(u32(SpvMemorySemanticsMaskNone));
// Helper to build the builtin call with the common operands.
auto build = [&](enum spirv::BuiltinFn builtin_fn) {
return b.CallWithResult<spirv::ir::BuiltinCall>(builtin->DetachResult(), builtin_fn,
pointer, memory, memory_semantics);
};
// Create the replacement call instruction.
core::ir::Call* call = nullptr;
switch (builtin->Func()) {
case core::BuiltinFn::kAtomicAdd:
call = build(spirv::BuiltinFn::kAtomicIadd);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicAnd:
call = build(spirv::BuiltinFn::kAtomicAnd);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicCompareExchangeWeak: {
auto* cmp = builtin->Args()[1];
auto* value = builtin->Args()[2];
auto* int_ty = value->Type();
call =
b.Call<spirv::ir::BuiltinCall>(int_ty, spirv::BuiltinFn::kAtomicCompareExchange,
pointer, memory, memory_semantics);
call->AppendArg(memory_semantics);
call->AppendArg(value);
call->AppendArg(cmp);
call->InsertBefore(builtin);
// Compare the original value to the comparator to see if an exchange happened.
auto* original = call->Result(0);
auto* compare = b.Equal(ty.bool_(), original, cmp);
compare->InsertBefore(builtin);
// Construct the atomicCompareExchange result structure.
call = b.ConstructWithResult(builtin->DetachResult(),
Vector{original, compare->Result(0)});
break;
}
case core::BuiltinFn::kAtomicExchange:
call = build(spirv::BuiltinFn::kAtomicExchange);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicLoad:
call = build(spirv::BuiltinFn::kAtomicLoad);
break;
case core::BuiltinFn::kAtomicOr:
call = build(spirv::BuiltinFn::kAtomicOr);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicMax:
if (result_ty->IsSignedIntegerScalar()) {
call = build(spirv::BuiltinFn::kAtomicSmax);
} else {
call = build(spirv::BuiltinFn::kAtomicUmax);
}
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicMin:
if (result_ty->IsSignedIntegerScalar()) {
call = build(spirv::BuiltinFn::kAtomicSmin);
} else {
call = build(spirv::BuiltinFn::kAtomicUmin);
}
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicStore:
call = build(spirv::BuiltinFn::kAtomicStore);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicSub:
call = build(spirv::BuiltinFn::kAtomicIsub);
call->AppendArg(builtin->Args()[1]);
break;
case core::BuiltinFn::kAtomicXor:
call = build(spirv::BuiltinFn::kAtomicXor);
call->AppendArg(builtin->Args()[1]);
break;
default:
TINT_UNREACHABLE() << "unhandled atomic builtin";
}
call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle a `dot()` builtin.
/// @param builtin the builtin call instruction
void Dot(core::ir::CoreBuiltinCall* builtin) {
// OpDot only supports floating point operands, so we need to polyfill the integer case.
// TODO(crbug.com/tint/1267): If SPV_KHR_integer_dot_product is supported, use that instead.
if (builtin->Result(0)->Type()->IsIntegerScalar()) {
core::ir::Instruction* sum = nullptr;
auto* v1 = builtin->Args()[0];
auto* v2 = builtin->Args()[1];
auto* vec = v1->Type()->As<core::type::Vector>();
auto* elty = vec->Type();
for (uint32_t i = 0; i < vec->Width(); i++) {
b.InsertBefore(builtin, [&] {
auto* e1 = b.Access(elty, v1, u32(i));
auto* e2 = b.Access(elty, v2, u32(i));
auto* mul = b.Multiply(elty, e1, e2);
if (sum) {
sum = b.Add(elty, sum, mul);
} else {
sum = mul;
}
});
}
sum->SetResults(Vector{builtin->DetachResult()});
builtin->Destroy();
return;
}
// Replace the builtin call with a call to the spirv.dot intrinsic.
auto args = Vector<core::ir::Value*, 4>(builtin->Args());
auto* call = b.CallWithResult<spirv::ir::BuiltinCall>(
builtin->DetachResult(), spirv::BuiltinFn::kDot, std::move(args));
call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle a `dot4{I,U}8Packed()` builtin.
/// @param builtin the builtin call instruction
void DotPacked4x8(core::ir::CoreBuiltinCall* builtin) {
// Replace the builtin call with a call to the spirv.{s,u}dot intrinsic.
auto is_signed = builtin->Func() == core::BuiltinFn::kDot4I8Packed;
auto inst = is_signed ? spirv::BuiltinFn::kSdot : spirv::BuiltinFn::kUdot;
auto args = Vector<core::ir::Value*, 3>(builtin->Args());
args.Push(Literal(u32(SpvPackedVectorFormatPackedVectorFormat4x8Bit)));
auto* call = b.CallWithResult<spirv::ir::BuiltinCall>(builtin->DetachResult(), inst,
std::move(args));
call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle a `select()` builtin.
/// @param builtin the builtin call instruction
void Select(core::ir::CoreBuiltinCall* builtin) {
// Argument order is different in SPIR-V: (condition, true_operand, false_operand).
Vector<core::ir::Value*, 4> args = {
builtin->Args()[2],
builtin->Args()[1],
builtin->Args()[0],
};
// If the condition is scalar and the objects are vectors, we need to splat the condition
// into a vector of the same size.
// TODO(jrprice): We don't need to do this if we're targeting SPIR-V 1.4 or newer.
auto* vec = builtin->Result(0)->Type()->As<core::type::Vector>();
if (vec && args[0]->Type()->Is<core::type::Scalar>()) {
Vector<core::ir::Value*, 4> elements;
elements.Resize(vec->Width(), args[0]);
auto* construct = b.Construct(ty.vec(ty.bool_(), vec->Width()), std::move(elements));
construct->InsertBefore(builtin);
args[0] = construct->Result(0);
}
// Replace the builtin call with a call to the spirv.select intrinsic.
auto* call = b.CallWithResult<spirv::ir::BuiltinCall>(
builtin->DetachResult(), spirv::BuiltinFn::kSelect, std::move(args));
call->InsertBefore(builtin);
builtin->Destroy();
}
/// ImageOperands represents the optional image operands for an image instruction.
struct ImageOperands {
/// Bias
core::ir::Value* bias = nullptr;
/// Lod
core::ir::Value* lod = nullptr;
/// Grad (dx)
core::ir::Value* ddx = nullptr;
/// Grad (dy)
core::ir::Value* ddy = nullptr;
/// ConstOffset
core::ir::Value* offset = nullptr;
/// Sample
core::ir::Value* sample = nullptr;
};
/// Append optional image operands to an image intrinsic argument list.
/// @param operands the operands
/// @param args the argument list
/// @param insertion_point the insertion point for new instructions
/// @param requires_float_lod true if the lod needs to be a floating point value
void AppendImageOperands(ImageOperands& operands,
Vector<core::ir::Value*, 8>& args,
core::ir::CoreBuiltinCall* insertion_point,
bool requires_float_lod) {
// Add a placeholder argument for the image operand mask, which we will fill in when we have
// processed the image operands.
uint32_t image_operand_mask = 0u;
size_t mask_idx = args.Length();
args.Push(nullptr);
// Append the NonPrivateTexel flag to Read/Write storage textures when we load/store them.
if (use_vulkan_memory_model) {
if (insertion_point->Func() == core::BuiltinFn::kTextureLoad ||
insertion_point->Func() == core::BuiltinFn::kTextureStore) {
if (auto* st =
insertion_point->Args()[0]->Type()->As<core::type::StorageTexture>()) {
if (st->Access() == core::Access::kReadWrite) {
image_operand_mask |= SpvImageOperandsNonPrivateTexelMask;
}
}
}
}
// Add each of the optional image operands if used, updating the image operand mask.
if (operands.bias) {
image_operand_mask |= SpvImageOperandsBiasMask;
args.Push(operands.bias);
}
if (operands.lod) {
image_operand_mask |= SpvImageOperandsLodMask;
if (requires_float_lod && operands.lod->Type()->IsIntegerScalar()) {
auto* convert = b.Convert(ty.f32(), operands.lod);
convert->InsertBefore(insertion_point);
operands.lod = convert->Result(0);
}
args.Push(operands.lod);
}
if (operands.ddx) {
image_operand_mask |= SpvImageOperandsGradMask;
args.Push(operands.ddx);
args.Push(operands.ddy);
}
if (operands.offset) {
image_operand_mask |= SpvImageOperandsConstOffsetMask;
args.Push(operands.offset);
}
if (operands.sample) {
image_operand_mask |= SpvImageOperandsSampleMask;
args.Push(operands.sample);
}
// Replace the image operand mask with the final mask value, as a literal operand.
args[mask_idx] = Literal(u32(image_operand_mask));
}
/// Append an array index to a coordinate vector.
/// @param coords the coordinate vector
/// @param array_idx the array index
/// @param insertion_point the insertion point for new instructions
/// @returns the modified coordinate vector
core::ir::Value* AppendArrayIndex(core::ir::Value* coords,
core::ir::Value* array_idx,
core::ir::Instruction* insertion_point) {
auto* vec = coords->Type()->As<core::type::Vector>();
auto* element_ty = vec->Type();
// Convert the index to match the coordinate type if needed.
if (array_idx->Type() != element_ty) {
auto* array_idx_converted = b.Convert(element_ty, array_idx);
array_idx_converted->InsertBefore(insertion_point);
array_idx = array_idx_converted->Result(0);
}
// Construct a new coordinate vector.
auto num_coords = vec->Width();
auto* coord_ty = ty.vec(element_ty, num_coords + 1);
auto* construct = b.Construct(coord_ty, Vector{coords, array_idx});
construct->InsertBefore(insertion_point);
return construct->Result(0);
}
/// Handle a textureSample*() builtin.
/// @param builtin the builtin call instruction
void TextureSample(core::ir::CoreBuiltinCall* builtin) {
// Helper to get the next argument from the call, or nullptr if there are no more arguments.
uint32_t arg_idx = 0;
auto next_arg = [&]() {
return arg_idx < builtin->Args().Length() ? builtin->Args()[arg_idx++] : nullptr;
};
auto* texture = next_arg();
auto* sampler = next_arg();
auto* coords = next_arg();
auto* texture_ty = texture->Type()->As<core::type::Texture>();
// Use OpSampledImage to create an OpTypeSampledImage object.
auto* sampled_image = b.Call<spirv::ir::BuiltinCall>(ty.Get<type::SampledImage>(texture_ty),
spirv::BuiltinFn::kSampledImage,
Vector{texture, sampler});
sampled_image->InsertBefore(builtin);
// Append the array index to the coordinates if provided.
auto* array_idx = IsTextureArray(texture_ty->Dim()) ? next_arg() : nullptr;
if (array_idx) {
coords = AppendArrayIndex(coords, array_idx, builtin);
}
// Determine which SPIR-V function to use and which optional image operands are needed.
enum spirv::BuiltinFn function = BuiltinFn::kNone;
core::ir::Value* depth = nullptr;
ImageOperands operands;
switch (builtin->Func()) {
case core::BuiltinFn::kTextureSample:
function = spirv::BuiltinFn::kImageSampleImplicitLod;
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureSampleBias:
function = spirv::BuiltinFn::kImageSampleImplicitLod;
operands.bias = next_arg();
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureSampleCompare:
function = spirv::BuiltinFn::kImageSampleDrefImplicitLod;
depth = next_arg();
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureSampleCompareLevel:
function = spirv::BuiltinFn::kImageSampleDrefExplicitLod;
depth = next_arg();
operands.lod = b.Constant(0_f);
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureSampleGrad:
function = spirv::BuiltinFn::kImageSampleExplicitLod;
operands.ddx = next_arg();
operands.ddy = next_arg();
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureSampleLevel:
function = spirv::BuiltinFn::kImageSampleExplicitLod;
operands.lod = next_arg();
operands.offset = next_arg();
break;
default:
TINT_UNREACHABLE() << "unhandled texture sample builtin";
}
// Start building the argument list for the function.
// The first two operands are always the sampled image and then the coordinates, followed by
// the depth reference if used.
Vector<core::ir::Value*, 8> function_args;
function_args.Push(sampled_image->Result(0));
function_args.Push(coords);
if (depth) {
function_args.Push(depth);
}
// Add the optional image operands, if any.
AppendImageOperands(operands, function_args, builtin, /* requires_float_lod */ true);
// Call the function.
// If this is a depth comparison, the result is always f32, otherwise vec4f.
auto* result_ty = depth ? static_cast<const core::type::Type*>(ty.f32()) : ty.vec4<f32>();
core::ir::Instruction* result =
b.Call<spirv::ir::BuiltinCall>(result_ty, function, std::move(function_args));
result->InsertBefore(builtin);
// If this is not a depth comparison but we are sampling a depth texture, extract the first
// component to get the scalar f32 that SPIR-V expects.
if (!depth &&
texture_ty->IsAnyOf<core::type::DepthTexture, core::type::DepthMultisampledTexture>()) {
result = b.Access(ty.f32(), result, 0_u);
result->InsertBefore(builtin);
}
result->SetResults(Vector{builtin->DetachResult()});
builtin->Destroy();
}
/// Handle a textureGather*() builtin.
/// @param builtin the builtin call instruction
void TextureGather(core::ir::CoreBuiltinCall* builtin) {
// Helper to get the next argument from the call, or nullptr if there are no more arguments.
uint32_t arg_idx = 0;
auto next_arg = [&]() {
return arg_idx < builtin->Args().Length() ? builtin->Args()[arg_idx++] : nullptr;
};
auto* component = next_arg();
if (!component->Type()->IsIntegerScalar()) {
// The first argument wasn't the component, so it must be the texture instead.
// Use constant zero for the component.
component = b.Constant(0_u);
arg_idx--;
}
auto* texture = next_arg();
auto* sampler = next_arg();
auto* coords = next_arg();
auto* texture_ty = texture->Type()->As<core::type::Texture>();
// Use OpSampledImage to create an OpTypeSampledImage object.
auto* sampled_image = b.Call<spirv::ir::BuiltinCall>(ty.Get<type::SampledImage>(texture_ty),
spirv::BuiltinFn::kSampledImage,
Vector{texture, sampler});
sampled_image->InsertBefore(builtin);
// Append the array index to the coordinates if provided.
auto* array_idx = IsTextureArray(texture_ty->Dim()) ? next_arg() : nullptr;
if (array_idx) {
coords = AppendArrayIndex(coords, array_idx, builtin);
}
// Determine which SPIR-V function to use and which optional image operands are needed.
enum spirv::BuiltinFn function = BuiltinFn::kNone;
core::ir::Value* depth = nullptr;
ImageOperands operands;
switch (builtin->Func()) {
case core::BuiltinFn::kTextureGather:
function = spirv::BuiltinFn::kImageGather;
operands.offset = next_arg();
break;
case core::BuiltinFn::kTextureGatherCompare:
function = spirv::BuiltinFn::kImageDrefGather;
depth = next_arg();
operands.offset = next_arg();
break;
default:
TINT_UNIMPLEMENTED() << "unhandled texture gather builtin";
}
// Start building the argument list for the function.
// The first two operands are always the sampled image and then the coordinates, followed by
// either the depth reference or the component.
Vector<core::ir::Value*, 8> function_args;
function_args.Push(sampled_image->Result(0));
function_args.Push(coords);
if (depth) {
function_args.Push(depth);
} else {
function_args.Push(component);
}
// Add the optional image operands, if any.
AppendImageOperands(operands, function_args, builtin, /* requires_float_lod */ true);
// Call the function.
auto* texture_call = b.CallWithResult<spirv::ir::BuiltinCall>(
builtin->DetachResult(), function, std::move(function_args));
texture_call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle a textureLoad() builtin.
/// @param builtin the builtin call instruction
void TextureLoad(core::ir::CoreBuiltinCall* builtin) {
// Helper to get the next argument from the call, or nullptr if there are no more arguments.
uint32_t arg_idx = 0;
auto next_arg = [&]() {
return arg_idx < builtin->Args().Length() ? builtin->Args()[arg_idx++] : nullptr;
};
auto* texture = next_arg();
auto* coords = next_arg();
auto* texture_ty = texture->Type()->As<core::type::Texture>();
// Append the array index to the coordinates if provided.
auto* array_idx = IsTextureArray(texture_ty->Dim()) ? next_arg() : nullptr;
if (array_idx) {
coords = AppendArrayIndex(coords, array_idx, builtin);
}
// Start building the argument list for the builtin.
// The first two operands are always the texture and then the coordinates.
Vector<core::ir::Value*, 8> builtin_args;
builtin_args.Push(texture);
builtin_args.Push(coords);
// Add the optional image operands, if any.
ImageOperands operands;
if (texture_ty->IsAnyOf<core::type::MultisampledTexture,
core::type::DepthMultisampledTexture>()) {
operands.sample = next_arg();
} else {
operands.lod = next_arg();
}
AppendImageOperands(operands, builtin_args, builtin, /* requires_float_lod */ false);
// Call the builtin.
// The result is always a vec4 in SPIR-V.
auto* result_ty = builtin->Result(0)->Type();
bool expects_scalar_result = result_ty->Is<core::type::Scalar>();
if (expects_scalar_result) {
result_ty = ty.vec4(result_ty);
}
auto kind = texture_ty->Is<core::type::StorageTexture>() ? spirv::BuiltinFn::kImageRead
: spirv::BuiltinFn::kImageFetch;
core::ir::Instruction* result =
b.Call<spirv::ir::BuiltinCall>(result_ty, kind, std::move(builtin_args));
result->InsertBefore(builtin);
// If we are expecting a scalar result, extract the first component.
if (expects_scalar_result) {
result = b.Access(ty.f32(), result, 0_u);
result->InsertBefore(builtin);
}
result->SetResults(Vector{builtin->DetachResult()});
builtin->Destroy();
}
/// Handle a textureStore() builtin.
/// @param builtin the builtin call instruction
void TextureStore(core::ir::CoreBuiltinCall* builtin) {
// Helper to get the next argument from the call, or nullptr if there are no more arguments.
uint32_t arg_idx = 0;
auto next_arg = [&]() {
return arg_idx < builtin->Args().Length() ? builtin->Args()[arg_idx++] : nullptr;
};
auto* texture = next_arg();
auto* coords = next_arg();
auto* texture_ty = texture->Type()->As<core::type::Texture>();
// Append the array index to the coordinates if provided.
auto* array_idx = IsTextureArray(texture_ty->Dim()) ? next_arg() : nullptr;
if (array_idx) {
coords = AppendArrayIndex(coords, array_idx, builtin);
}
auto* texel = next_arg();
// Start building the argument list for the function.
// The first two operands are always the texture and then the coordinates.
Vector<core::ir::Value*, 8> function_args;
function_args.Push(texture);
function_args.Push(coords);
function_args.Push(texel);
ImageOperands operands;
AppendImageOperands(operands, function_args, builtin, /* requires_float_lod */ false);
// Call the function.
auto* texture_call = b.Call<spirv::ir::BuiltinCall>(
ty.void_(), spirv::BuiltinFn::kImageWrite, std::move(function_args));
texture_call->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle a textureDimensions() builtin.
/// @param builtin the builtin call instruction
void TextureDimensions(core::ir::CoreBuiltinCall* builtin) {
// Helper to get the next argument from the call, or nullptr if there are no more arguments.
uint32_t arg_idx = 0;
auto next_arg = [&]() {
return arg_idx < builtin->Args().Length() ? builtin->Args()[arg_idx++] : nullptr;
};
auto* texture = next_arg();
auto* texture_ty = texture->Type()->As<core::type::Texture>();
Vector<core::ir::Value*, 8> function_args;
function_args.Push(texture);
// Determine which SPIR-V function to use, and add the Lod argument if needed.
enum spirv::BuiltinFn function;
if (texture_ty
->IsAnyOf<core::type::MultisampledTexture, core::type::DepthMultisampledTexture,
core::type::StorageTexture>()) {
function = spirv::BuiltinFn::kImageQuerySize;
} else {
function = spirv::BuiltinFn::kImageQuerySizeLod;
if (auto* lod = next_arg()) {
function_args.Push(lod);
} else {
// Lod wasn't explicit, so assume 0.
function_args.Push(b.Constant(0_u));
}
}
// Add an extra component to the result vector for arrayed textures.
auto* result_ty = builtin->Result(0)->Type();
if (core::type::IsTextureArray(texture_ty->Dim())) {
auto* vec = result_ty->As<core::type::Vector>();
result_ty = ty.vec(vec->Type(), vec->Width() + 1);
}
// Call the function.
core::ir::Instruction* result =
b.Call<spirv::ir::BuiltinCall>(result_ty, function, std::move(function_args));
result->InsertBefore(builtin);
// Swizzle the first two components from the result for arrayed textures.
if (core::type::IsTextureArray(texture_ty->Dim())) {
result = b.Swizzle(builtin->Result(0)->Type(), result, {0, 1});
result->InsertBefore(builtin);
}
result->SetResults(Vector{builtin->DetachResult()});
builtin->Destroy();
}
/// Handle a textureNumLayers() builtin.
/// @param builtin the builtin call instruction
void TextureNumLayers(core::ir::CoreBuiltinCall* builtin) {
auto* texture = builtin->Args()[0];
auto* texture_ty = texture->Type()->As<core::type::Texture>();
Vector<core::ir::Value*, 2> function_args;
function_args.Push(texture);
// Determine which SPIR-V function to use, and add the Lod argument if needed.
enum spirv::BuiltinFn function;
if (texture_ty
->IsAnyOf<core::type::MultisampledTexture, core::type::DepthMultisampledTexture,
core::type::StorageTexture>()) {
function = spirv::BuiltinFn::kImageQuerySize;
} else {
function = spirv::BuiltinFn::kImageQuerySizeLod;
function_args.Push(b.Constant(0_u));
}
// Call the function.
auto* texture_call =
b.Call<spirv::ir::BuiltinCall>(ty.vec3<u32>(), function, std::move(function_args));
texture_call->InsertBefore(builtin);
// Extract the third component to get the number of array layers.
auto* extract = b.AccessWithResult(builtin->DetachResult(), texture_call->Result(0), 2_u);
extract->InsertBefore(builtin);
builtin->Destroy();
}
/// Scalarize the vector form of a `quantizeToF16()` builtin.
/// See crbug.com/tint/1741.
/// @param builtin the builtin call instruction
void QuantizeToF16Vec(core::ir::CoreBuiltinCall* builtin) {
auto* arg = builtin->Args()[0];
auto* vec = arg->Type()->As<core::type::Vector>();
TINT_ASSERT(vec);
// Replace the builtin call with a call to the spirv.dot intrinsic.
Vector<core::ir::Value*, 4> args;
for (uint32_t i = 0; i < vec->Width(); i++) {
auto* el = b.Access(ty.f32(), arg, u32(i));
auto* scalar_call = b.Call(ty.f32(), core::BuiltinFn::kQuantizeToF16, el);
args.Push(scalar_call->Result(0));
el->InsertBefore(builtin);
scalar_call->InsertBefore(builtin);
}
auto* construct = b.ConstructWithResult(builtin->DetachResult(), std::move(args));
construct->InsertBefore(builtin);
builtin->Destroy();
}
/// Handle an inputAttachmentLoad() builtin.
/// @param builtin the builtin call instruction
void InputAttachmentLoad(core::ir::CoreBuiltinCall* builtin) {
TINT_ASSERT(builtin->Args().Length() == 1);
auto* texture = builtin->Args()[0];
// coords for input_attachment are always (0, 0)
auto* coords = b.Composite(ty.vec2<i32>(), 0_i, 0_i);
// Start building the argument list for the builtin.
// The first two operands are always the texture and then the coordinates.
Vector<core::ir::Value*, 8> builtin_args;
builtin_args.Push(texture);
builtin_args.Push(coords);
// Call the builtin.
// The result is always a vec4 in SPIR-V.
auto* result_ty = builtin->Result(0)->Type();
TINT_ASSERT(result_ty->Is<core::type::Vector>());
core::ir::Instruction* result = b.Call<spirv::ir::BuiltinCall>(
result_ty, spirv::BuiltinFn::kImageRead, std::move(builtin_args));
result->InsertBefore(builtin);
result->SetResults(Vector{builtin->DetachResult()});
builtin->Destroy();
}
/// Handle a SubgroupShuffle() builtin.
/// @param builtin the builtin call instruction
void SubgroupShuffle(core::ir::CoreBuiltinCall* builtin) {
TINT_ASSERT(builtin->Args().Length() == 2);
auto* id = builtin->Args()[1];
// Id must be an unsigned integer scalar, so bitcast if necessary.
if (id->Type()->IsSignedIntegerScalar()) {
auto* cast = b.Bitcast(ty.u32(), id);
cast->InsertBefore(builtin);
builtin->SetArg(1, cast->Result(0));
}
}
/// Handle a SubgroupBroadcast() builtin.
/// @param builtin the builtin call instruction
void SubgroupBroadcast(core::ir::CoreBuiltinCall* builtin) {
TINT_ASSERT(builtin->Args().Length() == 2);
auto* id = builtin->Args()[1];
TINT_ASSERT(id->Is<core::ir::Constant>());
// For const signed int IDs, compile-time convert to u32 to maintain constness.
if (id->Type()->IsSignedIntegerScalar()) {
builtin->SetArg(1, b.Constant(id->As<core::ir::Constant>()->Value()->ValueAs<u32>()));
}
}
/// Handle a QuadBroadcast() builtin.
/// @param builtin the builtin call instruction
void QuadBroadcast(core::ir::CoreBuiltinCall* builtin) {
TINT_ASSERT(builtin->Args().Length() == 2);
auto* id = builtin->Args()[1];
TINT_ASSERT(id->Is<core::ir::Constant>());
// For const signed int IDs, compile-time convert to u32 to maintain constness.
if (id->Type()->IsSignedIntegerScalar()) {
builtin->SetArg(1, b.Constant(id->As<core::ir::Constant>()->Value()->ValueAs<u32>()));
}
}
};
} // namespace
Result<SuccessType> BuiltinPolyfill(core::ir::Module& ir, bool use_vulkan_memory_model) {
auto result = ValidateAndDumpIfNeeded(ir, "BuiltinPolyfill transform");
if (result != Success) {
return result.Failure();
}
State{ir, use_vulkan_memory_model}.Process();
return Success;
}
} // namespace tint::spirv::writer::raise