| #pragma clang diagnostic ignored "-Wmissing-prototypes" |
| |
| #include <metal_stdlib> |
| #include <simd/simd.h> |
| |
| using namespace metal; |
| |
| struct spvAux |
| { |
| uint swizzleConst[1]; |
| }; |
| |
| // Returns 2D texture coords corresponding to 1D texel buffer coords |
| uint2 spvTexelBufferCoord(uint tc) |
| { |
| return uint2(tc % 4096, tc / 4096); |
| } |
| |
| enum class spvSwizzle : uint |
| { |
| none = 0, |
| zero, |
| one, |
| red, |
| green, |
| blue, |
| alpha |
| }; |
| |
| template<typename T> struct spvRemoveReference { typedef T type; }; |
| template<typename T> struct spvRemoveReference<thread T&> { typedef T type; }; |
| template<typename T> struct spvRemoveReference<thread T&&> { typedef T type; }; |
| template<typename T> inline constexpr thread T&& spvForward(thread typename spvRemoveReference<T>::type& x) |
| { |
| return static_cast<thread T&&>(x); |
| } |
| template<typename T> inline constexpr thread T&& spvForward(thread typename spvRemoveReference<T>::type&& x) |
| { |
| return static_cast<thread T&&>(x); |
| } |
| |
| template<typename T> |
| inline T spvGetSwizzle(vec<T, 4> x, T c, spvSwizzle s) |
| { |
| switch (s) |
| { |
| case spvSwizzle::none: |
| return c; |
| case spvSwizzle::zero: |
| return 0; |
| case spvSwizzle::one: |
| return 1; |
| case spvSwizzle::red: |
| return x.r; |
| case spvSwizzle::green: |
| return x.g; |
| case spvSwizzle::blue: |
| return x.b; |
| case spvSwizzle::alpha: |
| return x.a; |
| } |
| } |
| |
| // Wrapper function that swizzles texture samples and fetches. |
| template<typename T> |
| inline vec<T, 4> spvTextureSwizzle(vec<T, 4> x, uint s) |
| { |
| if (!s) |
| return x; |
| return vec<T, 4>(spvGetSwizzle(x, x.r, spvSwizzle((s >> 0) & 0xFF)), spvGetSwizzle(x, x.g, spvSwizzle((s >> 8) & 0xFF)), spvGetSwizzle(x, x.b, spvSwizzle((s >> 16) & 0xFF)), spvGetSwizzle(x, x.a, spvSwizzle((s >> 24) & 0xFF))); |
| } |
| |
| template<typename T> |
| inline T spvTextureSwizzle(T x, uint s) |
| { |
| return spvTextureSwizzle(vec<T, 4>(x, 0, 0, 1), s).x; |
| } |
| |
| // Wrapper function that swizzles texture gathers. |
| template<typename T, typename Tex, typename... Ts> |
| inline vec<T, 4> spvGatherSwizzle(sampler s, thread Tex& t, Ts... params, component c, uint sw) METAL_CONST_ARG(c) |
| { |
| if (sw) |
| { |
| switch (spvSwizzle((sw >> (uint(c) * 8)) & 0xFF)) |
| { |
| case spvSwizzle::none: |
| break; |
| case spvSwizzle::zero: |
| return vec<T, 4>(0, 0, 0, 0); |
| case spvSwizzle::one: |
| return vec<T, 4>(1, 1, 1, 1); |
| case spvSwizzle::red: |
| return t.gather(s, spvForward<Ts>(params)..., component::x); |
| case spvSwizzle::green: |
| return t.gather(s, spvForward<Ts>(params)..., component::y); |
| case spvSwizzle::blue: |
| return t.gather(s, spvForward<Ts>(params)..., component::z); |
| case spvSwizzle::alpha: |
| return t.gather(s, spvForward<Ts>(params)..., component::w); |
| } |
| } |
| switch (c) |
| { |
| case component::x: |
| return t.gather(s, spvForward<Ts>(params)..., component::x); |
| case component::y: |
| return t.gather(s, spvForward<Ts>(params)..., component::y); |
| case component::z: |
| return t.gather(s, spvForward<Ts>(params)..., component::z); |
| case component::w: |
| return t.gather(s, spvForward<Ts>(params)..., component::w); |
| } |
| } |
| |
| // Wrapper function that swizzles depth texture gathers. |
| template<typename T, typename Tex, typename... Ts> |
| inline vec<T, 4> spvGatherCompareSwizzle(sampler s, thread Tex& t, Ts... params, uint sw) |
| { |
| if (sw) |
| { |
| switch (spvSwizzle(sw & 0xFF)) |
| { |
| case spvSwizzle::none: |
| case spvSwizzle::red: |
| break; |
| case spvSwizzle::zero: |
| case spvSwizzle::green: |
| case spvSwizzle::blue: |
| case spvSwizzle::alpha: |
| return vec<T, 4>(0, 0, 0, 0); |
| case spvSwizzle::one: |
| return vec<T, 4>(1, 1, 1, 1); |
| } |
| } |
| return t.gather_compare(s, spvForward<Ts>(params)...); |
| } |
| |
| float4 doSwizzle(thread texture1d<float> tex1d, thread const sampler tex1dSmplr, thread texture2d<float> tex2d, thread const sampler tex2dSmplr, thread texture3d<float> tex3d, thread const sampler tex3dSmplr, thread texturecube<float> texCube, thread const sampler texCubeSmplr, thread texture2d_array<float> tex2dArray, thread const sampler tex2dArraySmplr, thread texturecube_array<float> texCubeArray, thread const sampler texCubeArraySmplr, thread depth2d<float> depth2d, thread const sampler depth2dSmplr, thread depthcube<float> depthCube, thread const sampler depthCubeSmplr, thread depth2d_array<float> depth2dArray, thread const sampler depth2dArraySmplr, thread depthcube_array<float> depthCubeArray, thread const sampler depthCubeArraySmplr, thread texture2d<float> texBuffer, constant spvAux& spvAuxBuffer) |
| { |
| float4 c = spvTextureSwizzle(tex1d.sample(tex1dSmplr, 0.0), spvAuxBuffer.swizzleConst[0]); |
| c = spvTextureSwizzle(tex2d.sample(tex2dSmplr, float2(0.0)), spvAuxBuffer.swizzleConst[1]); |
| c = spvTextureSwizzle(tex3d.sample(tex3dSmplr, float3(0.0)), spvAuxBuffer.swizzleConst[2]); |
| c = spvTextureSwizzle(texCube.sample(texCubeSmplr, float3(0.0)), spvAuxBuffer.swizzleConst[3]); |
| c = spvTextureSwizzle(tex2dArray.sample(tex2dArraySmplr, float3(0.0).xy, uint(round(float3(0.0).z))), spvAuxBuffer.swizzleConst[4]); |
| c = spvTextureSwizzle(texCubeArray.sample(texCubeArraySmplr, float4(0.0).xyz, uint(round(float4(0.0).w))), spvAuxBuffer.swizzleConst[5]); |
| c.x = spvTextureSwizzle(depth2d.sample_compare(depth2dSmplr, float3(0.0, 0.0, 1.0).xy, float3(0.0, 0.0, 1.0).z), spvAuxBuffer.swizzleConst[7]); |
| c.x = spvTextureSwizzle(depthCube.sample_compare(depthCubeSmplr, float4(0.0, 0.0, 0.0, 1.0).xyz, float4(0.0, 0.0, 0.0, 1.0).w), spvAuxBuffer.swizzleConst[8]); |
| c.x = spvTextureSwizzle(depth2dArray.sample_compare(depth2dArraySmplr, float4(0.0, 0.0, 0.0, 1.0).xy, uint(round(float4(0.0, 0.0, 0.0, 1.0).z)), float4(0.0, 0.0, 0.0, 1.0).w), spvAuxBuffer.swizzleConst[9]); |
| c.x = spvTextureSwizzle(depthCubeArray.sample_compare(depthCubeArraySmplr, float4(0.0).xyz, uint(round(float4(0.0).w)), 1.0), spvAuxBuffer.swizzleConst[10]); |
| c = spvTextureSwizzle(tex1d.sample(tex1dSmplr, float2(0.0, 1.0).x / float2(0.0, 1.0).y), spvAuxBuffer.swizzleConst[0]); |
| c = spvTextureSwizzle(tex2d.sample(tex2dSmplr, float3(0.0, 0.0, 1.0).xy / float3(0.0, 0.0, 1.0).z), spvAuxBuffer.swizzleConst[1]); |
| c = spvTextureSwizzle(tex3d.sample(tex3dSmplr, float4(0.0, 0.0, 0.0, 1.0).xyz / float4(0.0, 0.0, 0.0, 1.0).w), spvAuxBuffer.swizzleConst[2]); |
| float4 _103 = float4(0.0, 0.0, 1.0, 1.0); |
| _103.z = float4(0.0, 0.0, 1.0, 1.0).w; |
| c.x = spvTextureSwizzle(depth2d.sample_compare(depth2dSmplr, _103.xy / _103.z, float4(0.0, 0.0, 1.0, 1.0).z), spvAuxBuffer.swizzleConst[7]); |
| c = spvTextureSwizzle(tex1d.sample(tex1dSmplr, 0.0), spvAuxBuffer.swizzleConst[0]); |
| c = spvTextureSwizzle(tex2d.sample(tex2dSmplr, float2(0.0), level(0.0)), spvAuxBuffer.swizzleConst[1]); |
| c = spvTextureSwizzle(tex3d.sample(tex3dSmplr, float3(0.0), level(0.0)), spvAuxBuffer.swizzleConst[2]); |
| c = spvTextureSwizzle(texCube.sample(texCubeSmplr, float3(0.0), level(0.0)), spvAuxBuffer.swizzleConst[3]); |
| c = spvTextureSwizzle(tex2dArray.sample(tex2dArraySmplr, float3(0.0).xy, uint(round(float3(0.0).z)), level(0.0)), spvAuxBuffer.swizzleConst[4]); |
| c = spvTextureSwizzle(texCubeArray.sample(texCubeArraySmplr, float4(0.0).xyz, uint(round(float4(0.0).w)), level(0.0)), spvAuxBuffer.swizzleConst[5]); |
| c.x = spvTextureSwizzle(depth2d.sample_compare(depth2dSmplr, float3(0.0, 0.0, 1.0).xy, float3(0.0, 0.0, 1.0).z, level(0.0)), spvAuxBuffer.swizzleConst[7]); |
| c = spvTextureSwizzle(tex1d.sample(tex1dSmplr, float2(0.0, 1.0).x / float2(0.0, 1.0).y), spvAuxBuffer.swizzleConst[0]); |
| c = spvTextureSwizzle(tex2d.sample(tex2dSmplr, float3(0.0, 0.0, 1.0).xy / float3(0.0, 0.0, 1.0).z, level(0.0)), spvAuxBuffer.swizzleConst[1]); |
| c = spvTextureSwizzle(tex3d.sample(tex3dSmplr, float4(0.0, 0.0, 0.0, 1.0).xyz / float4(0.0, 0.0, 0.0, 1.0).w, level(0.0)), spvAuxBuffer.swizzleConst[2]); |
| float4 _131 = float4(0.0, 0.0, 1.0, 1.0); |
| _131.z = float4(0.0, 0.0, 1.0, 1.0).w; |
| c.x = spvTextureSwizzle(depth2d.sample_compare(depth2dSmplr, _131.xy / _131.z, float4(0.0, 0.0, 1.0, 1.0).z, level(0.0)), spvAuxBuffer.swizzleConst[7]); |
| c = spvTextureSwizzle(tex1d.read(uint(0)), spvAuxBuffer.swizzleConst[0]); |
| c = spvTextureSwizzle(tex2d.read(uint2(int2(0)), 0), spvAuxBuffer.swizzleConst[1]); |
| c = spvTextureSwizzle(tex3d.read(uint3(int3(0)), 0), spvAuxBuffer.swizzleConst[2]); |
| c = spvTextureSwizzle(tex2dArray.read(uint2(int3(0).xy), uint(int3(0).z), 0), spvAuxBuffer.swizzleConst[4]); |
| c = texBuffer.read(spvTexelBufferCoord(0)); |
| c = spvGatherSwizzle<float, metal::texture2d<float>, float2, int2>(tex2dSmplr, tex2d, float2(0.0), int2(0), component::x, spvAuxBuffer.swizzleConst[1]); |
| c = spvGatherSwizzle<float, metal::texturecube<float>, float3>(texCubeSmplr, texCube, float3(0.0), component::y, spvAuxBuffer.swizzleConst[3]); |
| c = spvGatherSwizzle<float, metal::texture2d_array<float>, float2, uint, int2>(tex2dArraySmplr, tex2dArray, float3(0.0).xy, uint(round(float3(0.0).z)), int2(0), component::z, spvAuxBuffer.swizzleConst[4]); |
| c = spvGatherSwizzle<float, metal::texturecube_array<float>, float3, uint>(texCubeArraySmplr, texCubeArray, float4(0.0).xyz, uint(round(float4(0.0).w)), component::w, spvAuxBuffer.swizzleConst[5]); |
| c = spvGatherCompareSwizzle<float, metal::depth2d<float>, float2, float>(depth2dSmplr, depth2d, float2(0.0), 1.0, spvAuxBuffer.swizzleConst[7]); |
| c = spvGatherCompareSwizzle<float, metal::depthcube<float>, float3, float>(depthCubeSmplr, depthCube, float3(0.0), 1.0, spvAuxBuffer.swizzleConst[8]); |
| c = spvGatherCompareSwizzle<float, metal::depth2d_array<float>, float2, uint, float>(depth2dArraySmplr, depth2dArray, float3(0.0).xy, uint(round(float3(0.0).z)), 1.0, spvAuxBuffer.swizzleConst[9]); |
| c = spvGatherCompareSwizzle<float, metal::depthcube_array<float>, float3, uint, float>(depthCubeArraySmplr, depthCubeArray, float4(0.0).xyz, uint(round(float4(0.0).w)), 1.0, spvAuxBuffer.swizzleConst[10]); |
| return c; |
| } |
| |
| fragment void main0(constant spvAux& spvAuxBuffer [[buffer(0)]], texture1d<float> tex1d [[texture(0)]], texture2d<float> tex2d [[texture(1)]], texture3d<float> tex3d [[texture(2)]], texturecube<float> texCube [[texture(3)]], texture2d_array<float> tex2dArray [[texture(4)]], texturecube_array<float> texCubeArray [[texture(5)]], texture2d<float> texBuffer [[texture(6)]], depth2d<float> depth2d [[texture(7)]], depthcube<float> depthCube [[texture(8)]], depth2d_array<float> depth2dArray [[texture(9)]], depthcube_array<float> depthCubeArray [[texture(10)]], sampler tex1dSmplr [[sampler(0)]], sampler tex2dSmplr [[sampler(1)]], sampler tex3dSmplr [[sampler(2)]], sampler texCubeSmplr [[sampler(3)]], sampler tex2dArraySmplr [[sampler(4)]], sampler texCubeArraySmplr [[sampler(5)]], sampler depth2dSmplr [[sampler(7)]], sampler depthCubeSmplr [[sampler(8)]], sampler depth2dArraySmplr [[sampler(9)]], sampler depthCubeArraySmplr [[sampler(10)]]) |
| { |
| float4 c = doSwizzle(tex1d, tex1dSmplr, tex2d, tex2dSmplr, tex3d, tex3dSmplr, texCube, texCubeSmplr, tex2dArray, tex2dArraySmplr, texCubeArray, texCubeArraySmplr, depth2d, depth2dSmplr, depthCube, depthCubeSmplr, depth2dArray, depth2dArraySmplr, depthCubeArray, depthCubeArraySmplr, texBuffer, spvAuxBuffer); |
| } |
| |