| // File-level counter, initialised to zero; i() increments it on every call. |
| static int counter = 0; |
| // Read-write byte-address buffer bound to register u1; f() stores its result at byte 0. |
| RWByteAddressBuffer s : register(u1); |
| // Constant buffer bound to register b0, exposing twelve uint4 elements as `a`. |
| // The loaders below address it by byte offset and reinterpret the bits as floats. |
| cbuffer cbuffer_a : register(b0) { |
|   uint4 a[12]; |
| }; |
| |
| // Advances the file-level `counter` by one and returns the updated value. |
| int i() { |
|   counter += 1; |
|   return counter; |
| } |
| |
| // Builds a float3x4 from three uint4 elements of `a`, addressed by the byte |
| // offsets `offset`, `offset + 16` and `offset + 32`; the bits are reinterpreted |
| // as floats rather than converted. |
| float3x4 a_load_1(uint offset) { |
|   // First / 4 turns a byte offset into a 32-bit scalar index, the second / 4 |
|   // turns that scalar index into an index into the uint4 array. |
|   const uint row0_slot = ((offset + 0u) / 4) / 4; |
|   const uint row1_slot = ((offset + 16u) / 4) / 4; |
|   const uint row2_slot = ((offset + 32u) / 4) / 4; |
|   const float4 row0 = asfloat(a[row0_slot]); |
|   const float4 row1 = asfloat(a[row1_slot]); |
|   const float4 row2 = asfloat(a[row2_slot]); |
|   return float3x4(row0, row1, row2); |
| } |
| |
| // Array type alias used as the return type of a_load. |
| typedef float3x4 a_load_ret[4]; |
| // Loads four float3x4 matrices via a_load_1, the first at byte `offset` and |
| // each following one 48 bytes further on. |
| a_load_ret a_load(uint offset) { |
|   float3x4 result[4] = (float3x4[4])0; |
|   // Running byte offset: equals offset + idx * 48u at the top of each iteration. |
|   uint byte_offset = offset; |
|   for (uint idx = 0u; idx < 4u; ++idx) { |
|     result[idx] = a_load_1(byte_offset); |
|     byte_offset += 48u; |
|   } |
|   return result; |
| } |
| |
| // Compute entry point declared with a 1x1x1 thread group. Reads `a` at four |
| // granularities (whole array, one matrix, one row, one scalar), sums one float |
| // from each and stores the bit pattern of the sum at byte 0 of `s`. |
| [numthreads(1, 1, 1)] |
| void f() { |
|   // The two i() calls must stay in this order: each one bumps `counter`. |
|   const int mat_idx = i(); |
|   const int row_idx = i(); |
|   // Byte offsets: 48 bytes per matrix, 16 bytes per row within a matrix. |
|   const uint mat_offset = 48u * uint(mat_idx); |
|   const uint row_offset = mat_offset + (16u * uint(row_idx)); |
|   // Byte offset -> 32-bit scalar index; / 4 again selects the uint4 element, |
|   // % 4 selects the component inside it. |
|   const uint scalar_idx = row_offset / 4; |
|   float3x4 all_mats[4] = a_load(0u); |
|   const float3x4 picked_mat = a_load_1(mat_offset); |
|   const float4 picked_row = asfloat(a[scalar_idx / 4]); |
|   const float picked_scalar = asfloat(a[scalar_idx / 4][scalar_idx % 4]); |
|   // Keep the original left-to-right association of the float additions. |
|   const float total = ((picked_scalar + all_mats[0][0].x) + picked_mat[0].x) + picked_row.x; |
|   s.Store(0u, asuint(total)); |
| } |