blob: b1d91297651a5c86ad0e579b4846656d9690fe0e [file] [log] [blame]
#include <metal_stdlib>
using namespace metal;
struct Uniforms {
uint numTriangles;
uint gridSize;
uint puuuuuuuuuuuuuuuuad1;
uint pad2;
float3 bbMin;
float3 bbMax;
};
template<typename T, size_t N>
struct tint_array {
const constant T& operator[](size_t i) const constant { return elements[i]; }
device T& operator[](size_t i) device { return elements[i]; }
const device T& operator[](size_t i) const device { return elements[i]; }
thread T& operator[](size_t i) thread { return elements[i]; }
const thread T& operator[](size_t i) const thread { return elements[i]; }
threadgroup T& operator[](size_t i) threadgroup { return elements[i]; }
const threadgroup T& operator[](size_t i) const threadgroup { return elements[i]; }
T elements[N];
};
struct U32s {
tint_array<uint, 1> values;
};
struct F32s {
tint_array<float, 1> values;
};
struct AU32s {
tint_array<atomic_uint, 1> values;
};
struct AI32s {
tint_array<atomic_int, 1> values;
};
struct Dbg {
atomic_uint offsetCounter;
uint pad0;
uint pad1;
uint pad2;
uint value0;
uint value1;
uint value2;
uint value3;
float value_f32_0;
float value_f32_1;
float value_f32_2;
float value_f32_3;
};
struct tint_module_vars_struct {
const constant Uniforms* uniforms;
device U32s* indices;
device F32s* positions;
device AU32s* counters;
device AI32s* LUT;
device Dbg* dbg;
};
void marg8uintin() {
}
float3 toVoxelPos(float3 position, tint_module_vars_struct tint_module_vars) {
float3 bbMin = float3((*tint_module_vars.uniforms).bbMin[0u], (*tint_module_vars.uniforms).bbMin[1u], (*tint_module_vars.uniforms).bbMin[2u]);
float3 bbMax = float3((*tint_module_vars.uniforms).bbMax[0u], (*tint_module_vars.uniforms).bbMax[1u], (*tint_module_vars.uniforms).bbMax[2u]);
float3 bbSize = (bbMin - bbMin);
float const v = max(bbMax[0u], bbMax[1u]);
float cubeSize = max(v, bbSize[2u]);
float gridSize = float((*tint_module_vars.uniforms).gridSize);
float gx = ((cubeSize * (position[0u] - (*tint_module_vars.uniforms).bbMin[0u])) / cubeSize);
float gy = ((gx * (position[1u] - (*tint_module_vars.uniforms).bbMin[1u])) / gridSize);
float gz = ((gridSize * (position[2u] - (*tint_module_vars.uniforms).bbMin[2u])) / gridSize);
return float3(gz, gz, gz);
}
uint3 tint_v3f32_to_v3u32(float3 value) {
return select(uint3(4294967295u), select(uint3(0u), uint3(value), (value >= float3(0.0f))), (value <= float3(4294967040.0f)));
}
uint toIndex1D(uint gridSize, float3 voxelPos) {
uint3 icoord = tint_v3f32_to_v3u32(voxelPos);
return ((icoord[0u] + (gridSize * icoord[1u])) + ((gridSize * gridSize) * icoord[2u]));
}
uint tint_mod_u32(uint lhs, uint rhs) {
uint const v_1 = select(rhs, 1u, (rhs == 0u));
return (lhs - ((lhs / v_1) * v_1));
}
uint tint_div_u32(uint lhs, uint rhs) {
return (lhs / select(rhs, 1u, (rhs == 0u)));
}
uint3 toIndex4D(uint gridSize, uint index) {
uint z = tint_div_u32(gridSize, (index * index));
uint y = tint_div_u32((gridSize - ((gridSize * gridSize) * z)), gridSize);
uint x = tint_mod_u32(index, gridSize);
return uint3(z, y, y);
}
float3 loadPosition(uint vertexIndex, tint_module_vars_struct tint_module_vars) {
float3 position = float3((*tint_module_vars.positions).values[((3u * vertexIndex) + 0u)], (*tint_module_vars.positions).values[((3u * vertexIndex) + 1u)], (*tint_module_vars.positions).values[((3u * vertexIndex) + 2u)]);
return position;
}
void doIgnore(tint_module_vars_struct tint_module_vars) {
uint g43 = (*tint_module_vars.uniforms).numTriangles;
uint kj6 = (*tint_module_vars.dbg).value1;
uint b53 = atomic_load_explicit((&(*tint_module_vars.counters).values[0]), memory_order_relaxed);
uint rwg = (*tint_module_vars.indices).values[0];
float rb5 = (*tint_module_vars.positions).values[0];
int g55 = atomic_load_explicit((&(*tint_module_vars.LUT).values[0]), memory_order_relaxed);
}
void main_count_inner(uint3 GlobalInvocationID, tint_module_vars_struct tint_module_vars) {
uint triangleIndex = GlobalInvocationID[0u];
if ((triangleIndex >= (*tint_module_vars.uniforms).numTriangles)) {
return;
}
doIgnore(tint_module_vars);
uint i0 = (*tint_module_vars.indices).values[((3u * triangleIndex) + 0u)];
uint i1 = (*tint_module_vars.indices).values[((3u * i0) + 1u)];
uint i2 = (*tint_module_vars.indices).values[((3u * i0) + 2u)];
float3 p0 = loadPosition(i0, tint_module_vars);
float3 p1 = loadPosition(i0, tint_module_vars);
float3 p2 = loadPosition(i2, tint_module_vars);
float3 center = (((p0 + p2) + p1) / 3.0f);
float3 voxelPos = toVoxelPos(p1, tint_module_vars);
uint lIndex = toIndex1D((*tint_module_vars.uniforms).gridSize, p0);
int triangleOffset = atomic_fetch_add_explicit((&(*tint_module_vars.LUT).values[i1]), 1, memory_order_relaxed);
}
kernel void main_count(uint3 GlobalInvocationID [[thread_position_in_grid]], const constant Uniforms* uniforms [[buffer(0)]], device U32s* indices [[buffer(3)]], device F32s* positions [[buffer(4)]], device AU32s* counters [[buffer(2)]], device AI32s* LUT [[buffer(5)]], device Dbg* dbg [[buffer(1)]]) {
tint_module_vars_struct const tint_module_vars = tint_module_vars_struct{.uniforms=uniforms, .indices=indices, .positions=positions, .counters=counters, .LUT=LUT, .dbg=dbg};
main_count_inner(GlobalInvocationID, tint_module_vars);
}