Jam
/
GGJ_2019


								// Upgrade NOTE: replaced 'mul(UNITY_MATRIX_MVP,*)' with 'UnityObjectToClipPos(*)'


								// Copyright (c) <2015> <Playdead>

								// This file is subject to the MIT License as seen in the root of this folder structure (LICENSE.TXT)

								// AUTHOR: Lasse Jon Fuglsang Pedersen <lasse@playdead.com>


								Shader "Hidden/TAA"

								{

									// Material properties. _MainTex is declared again as a sampler2D uniform
									// inside the CGINCLUDE block below, where it is sampled as the current frame.
									Properties

									{

										_MainTex ("Base (RGB)", 2D) = "white" {}

									}


									CGINCLUDE

									//--- program begin


									// Compile configuration for the code in this CGINCLUDE block.
									#pragma only_renderers ps4 xboxone d3d11 d3d9 xbox360 opengl glcore gles3 metal vulkan

									#pragma target 3.0


									// Variant keywords. CAMERA_* are not tested anywhere in this file
									// (presumably consumed by the included IncDepth.cginc -- confirm).
									#pragma multi_compile CAMERA_PERSPECTIVE CAMERA_ORTHOGRAPHIC

									// One MINMAX_* keyword must be active; temporal_reprojection hits #error otherwise.
									#pragma multi_compile MINMAX_3X3 MINMAX_3X3_ROUNDED MINMAX_4TAP_VARYING

									// Optional features, each tested with #if further down in this file.
									#pragma multi_compile __ UNJITTER_COLORSAMPLES

									#pragma multi_compile __ UNJITTER_NEIGHBORHOOD

									#pragma multi_compile __ UNJITTER_REPROJECTION

									#pragma multi_compile __ USE_YCOCG

									#pragma multi_compile __ USE_CLIPPING

									#pragma multi_compile __ USE_DILATION

									#pragma multi_compile __ USE_MOTION_BLUR

									#pragma multi_compile __ USE_MOTION_BLUR_NEIGHBORMAX

									#pragma multi_compile __ USE_OPTIMIZATIONS


									#include "UnityCG.cginc"

									#include "IncDepth.cginc"

									#include "IncNoise.cginc"


								// Small epsilon used by clip_aabb and by the MINMAX_4TAP_VARYING path of
								// temporal_reprojection; a larger value is chosen when SHADER_API_MOBILE is set.
								#if SHADER_API_MOBILE

									static const float FLT_EPS = 0.0001f;

								#else

									static const float FLT_EPS = 0.00000001f;

								#endif


									uniform float4 _JitterUV;// frustum jitter uv deltas, where xy = current frame, zw = previous


									// Current frame colour: sampled for texel0, the neighbourhood min/max and motion blur.
									uniform sampler2D _MainTex;

									// .xy is used as the one-texel uv step; .zw scales uv-space velocity in frag's motion-blur trust test.
									uniform float4 _MainTex_TexelSize;


									// Velocity in uv units (.xy is subtracted from ss_txc when sampling _PrevTex).
									uniform sampler2D_half _VelocityBuffer;

									// Only sampled when USE_MOTION_BLUR_NEIGHBORMAX is set.
									uniform sampler2D _VelocityNeighborMax;


									// Texture sampled at (ss_txc - ss_vel) for the reprojected sample
									// (presumably the 'buffer' output of the previous frame -- confirm against the script side).
									uniform sampler2D _PrevTex;

									// Endpoints of the lerp that produces the blend weight k_feedback in temporal_reprojection.
									uniform float _FeedbackMin;

									uniform float _FeedbackMax;

									// Multiplier applied to the velocity that drives motion blur in frag.
									uniform float _MotionScale;


									// Vertex-to-fragment interpolants: clip-space position and the uv used for all texture lookups.
									struct v2f

									{

										float4 cs_pos : SV_POSITION;

										float2 ss_txc : TEXCOORD0;

									};


									// Vertex stage: transforms the incoming vertex to clip space and forwards its
									// texcoord, remapped through UnityStereoTransformScreenSpaceTex when
									// UNITY_SINGLE_PASS_STEREO is set.
									v2f vert(appdata_img IN)
									{
										v2f OUT;

										// The former "#if UNITY_VERSION < 540" had byte-identical branches,
										// so a single unconditional call is equivalent.
										OUT.cs_pos = UnityObjectToClipPos(IN.vertex);

									#if UNITY_SINGLE_PASS_STEREO
										OUT.ss_txc = UnityStereoTransformScreenSpaceTex(IN.texcoord.xy);
									#else
										OUT.ss_txc = IN.texcoord.xy;
									#endif

										return OUT;
									}


									// https://software.intel.com/en-us/node/503873

									// Converts an RGB triple to YCoCg, returned as (Y, Co, Cg):
									//   Y  =  R/4 + G/2 + B/4
									//   Co =  R/2       - B/2
									//   Cg = -R/4 + G/2 - B/4
									float3 RGB_YCoCg(float3 c)
									{
										float luma     =  c.x/4.0 + c.y/2.0 + c.z/4.0;
										float chroma_o =  c.x/2.0 - c.z/2.0;
										float chroma_g = -c.x/4.0 + c.y/2.0 - c.z/4.0;

										return float3(luma, chroma_o, chroma_g);
									}


									// https://software.intel.com/en-us/node/503873

									// Converts a (Y, Co, Cg) triple back to RGB and saturates the result to [0, 1]:
									//   R = Y + Co - Cg
									//   G = Y      + Cg
									//   B = Y - Co - Cg
									float3 YCoCg_RGB(float3 c)
									{
										float red   = c.x + c.y - c.z;
										float green = c.x + c.z;
										float blue  = c.x - c.y - c.z;

										return saturate(float3(red, green, blue));
									}


									// Samples 'tex' at 'uv'. With USE_YCOCG the rgb channels are converted to
									// YCoCg; alpha is passed through untouched in both cases.
									float4 sample_color(sampler2D tex, float2 uv)
									{
										float4 texel = tex2D(tex, uv);

									#if USE_YCOCG
										texel = float4(RGB_YCoCg(texel.rgb), texel.a);
									#endif

										return texel;
									}


									// Inverse of the colour-space step in sample_color: with USE_YCOCG the rgb
									// channels are converted back to RGB, otherwise 'c' is returned unchanged.
									// Alpha is preserved.
									float4 resolve_color(float4 c)
									{
									#if USE_YCOCG
										float3 rgb = YCoCg_RGB(c.rgb).rgb;
										return float4(rgb, c.a);
									#else
										return c;
									#endif
									}


									// Pulls 'q' back towards the colour box [aabb_min, aabb_max].
									//   USE_OPTIMIZATIONS: clips q towards the box centre (p is only used for its w).
									//   otherwise:         scales the segment p -> q, one axis at a time, until it
									//                      fits inside the box (within FLT_EPS).
									// The w component is carried along with the xyz scaling in both variants.
									float4 clip_aabb(float3 aabb_min, float3 aabb_max, float4 p, float4 q)
									{
									#if USE_OPTIMIZATIONS
										// note: only clips towards aabb center (but fast!)
										float4 center      = float4(0.5 * (aabb_max + aabb_min), p.w);
										float3 half_extent = 0.5 * (aabb_max - aabb_min) + FLT_EPS;

										float4 offset    = q - center;
										float3 scaled    = abs(offset.xyz / half_extent);
										float  overshoot = max(scaled.x, max(scaled.y, scaled.z));

										// overshoot > 1 means q lies outside the box on at least one axis
										if (overshoot > 1.0)
										{
											return center + offset / overshoot;
										}

										return q;// point inside aabb
									#else
										float4 delta   = q - p;
										float3 room_hi = aabb_max - p.xyz;
										float3 room_lo = aabb_min - p.xyz;

										// upper faces, x then y then z; each rescale affects the later tests
										if (delta.x > room_hi.x + FLT_EPS) { delta *= (room_hi.x / delta.x); }
										if (delta.y > room_hi.y + FLT_EPS) { delta *= (room_hi.y / delta.y); }
										if (delta.z > room_hi.z + FLT_EPS) { delta *= (room_hi.z / delta.z); }

										// lower faces, same order
										if (delta.x < room_lo.x - FLT_EPS) { delta *= (room_lo.x / delta.x); }
										if (delta.y < room_lo.y - FLT_EPS) { delta *= (room_lo.y / delta.y); }
										if (delta.z < room_lo.z - FLT_EPS) { delta *= (room_lo.z / delta.z); }

										return p + delta;
									#endif
									}


									// Returns the .xy sample with the largest squared length found in the
									// (2*support+1) x (2*support+1) texel window centred on 'uv'.
									//   tex     - texture to read .xy from
									//   uv      - window centre
									//   support - window radius in texels (steps of _MainTex_TexelSize.xy)
									// Returns float2(0, 0) when no sample has a non-zero length, and also when
									// 'support' is negative (the loops then run zero times).
									float2 sample_velocity_dilated(sampler2D tex, float2 uv, int support)
									{
										float2 du = float2(_MainTex_TexelSize.x, 0.0);
										float2 dv = float2(0.0, _MainTex_TexelSize.y);
										float2 mv = 0.0;
										float rmv = 0.0;

										// Relational bounds instead of "!= support + 1": identical for
										// support >= 0, but terminates immediately for a negative support
										// instead of counting until the index wraps around.
										for (int i = -support; i <= support; i++)
										{
											for (int j = -support; j <= support; j++)
											{
												float2 v = tex2D(tex, uv + i * dv + j * du).xy;
												float rv = dot(v, v);

												// strict '>' keeps the first of several equally long samples
												if (rv > rmv)
												{
													mv = v;
													rmv = rv;
												}
											}
										}

										return mv;
									}


									// Box-filtered blur of 'tex' along the velocity direction: 2*3+1 taps spread
									// over half of 'ss_vel' to each side of 'uv'. The starting point is offset
									// by half a tap step times PDsrand(uv + _SinTime.xx).
									// Returns the average in the colour space produced by sample_color.
									float4 sample_color_motion(sampler2D tex, float2 uv, float2 ss_vel)
									{
										const int taps_per_side = 3;// on either side!
										const float2 half_vel = 0.5 * ss_vel;

										float2 tap_step = half_vel / taps_per_side;
										float jitter = PDsrand(uv + _SinTime.xx);
										float2 origin = uv + tap_step * (0.5 * jitter);

										float4 color_sum = 0.0;
										float weight_sum = 0.0;

										[unroll]
										for (int tap = -taps_per_side; tap <= taps_per_side; tap++)
										{
											// box weights; triangle (taps - abs(i) + 1) and pointy triangle
											// (1.0 / (1 + abs(i))) were the alternatives tried here
											float weight = 1.0;

											color_sum += weight * sample_color(tex, origin + tap * tap_step);
											weight_sum += weight;
										}

										return color_sum / weight_sum;
									}


									// Blends the current-frame sample with the reprojected _PrevTex sample.
									//   ss_txc  - uv of the fragment being resolved
									//   ss_vel  - velocity in uv units; _PrevTex is read at ss_txc - ss_vel
									//   vs_dist - only used by the MINMAX_4TAP_VARYING path, where it scales the
									//             velocity magnitude measured in texels
									// The reprojected sample is first constrained to the min/max of the current
									// neighbourhood (clamp, or clip_aabb with USE_CLIPPING), then mixed with the
									// current sample using a weight between _FeedbackMin and _FeedbackMax.
									// The result is in the colour space of sample_color (YCoCg with USE_YCOCG);
									// callers pass it through resolve_color.
									float4 temporal_reprojection(float2 ss_txc, float2 ss_vel, float vs_dist)

									{

										// read texels

									#if UNJITTER_COLORSAMPLES

										float4 texel0 = sample_color(_MainTex, ss_txc - _JitterUV.xy);

									#else

										float4 texel0 = sample_color(_MainTex, ss_txc);

									#endif

										float4 texel1 = sample_color(_PrevTex, ss_txc - ss_vel);


										// calc min-max of current neighbourhood

									#if UNJITTER_NEIGHBORHOOD

										float2 uv = ss_txc - _JitterUV.xy;

									#else

										float2 uv = ss_txc;

									#endif


									#if MINMAX_3X3 || MINMAX_3X3_ROUNDED


										float2 du = float2(_MainTex_TexelSize.x, 0.0);

										float2 dv = float2(0.0, _MainTex_TexelSize.y);


										// 3x3 taps around uv; first letter after 'c' is the row (t/m/b = -dv/0/+dv),
										// second the column (l/c/r = -du/0/+du)
										float4 ctl = sample_color(_MainTex, uv - dv - du);

										float4 ctc = sample_color(_MainTex, uv - dv);

										float4 ctr = sample_color(_MainTex, uv - dv + du);

										float4 cml = sample_color(_MainTex, uv - du);

										float4 cmc = sample_color(_MainTex, uv);

										float4 cmr = sample_color(_MainTex, uv + du);

										float4 cbl = sample_color(_MainTex, uv + dv - du);

										float4 cbc = sample_color(_MainTex, uv + dv);

										float4 cbr = sample_color(_MainTex, uv + dv + du);


										float4 cmin = min(ctl, min(ctc, min(ctr, min(cml, min(cmc, min(cmr, min(cbl, min(cbc, cbr))))))));

										float4 cmax = max(ctl, max(ctc, max(ctr, max(cml, max(cmc, max(cmr, max(cbl, max(cbc, cbr))))))));


										// cavg is only declared for the variants that read it further down
										#if MINMAX_3X3_ROUNDED || USE_YCOCG || USE_CLIPPING

											float4 cavg = (ctl + ctc + ctr + cml + cmc + cmr + cbl + cbc + cbr) / 9.0;

										#endif


										// rounded variant: average the 3x3 result with the 5-tap plus-shaped result
										#if MINMAX_3X3_ROUNDED

											float4 cmin5 = min(ctc, min(cml, min(cmc, min(cmr, cbc))));

											float4 cmax5 = max(ctc, max(cml, max(cmc, max(cmr, cbc))));

											float4 cavg5 = (ctc + cml + cmc + cmr + cbc) / 5.0;

											cmin = 0.5 * (cmin + cmin5);

											cmax = 0.5 * (cmax + cmax5);

											cavg = 0.5 * (cavg + cavg5);

										#endif


									#elif MINMAX_4TAP_VARYING// this is the method used in v2 (PDTemporalReprojection2)


										const float _SubpixelThreshold = 0.5;

										const float _GatherBase = 0.5;

										const float _GatherSubpixelMotion = 0.1666;


										// velocity in texels, scaled by vs_dist
										float2 texel_vel = ss_vel / _MainTex_TexelSize.xy;

										float texel_vel_mag = length(texel_vel) * vs_dist;

										// 1 while the scaled magnitude is at or below the threshold, falling towards 0 above it
										float k_subpixel_motion = saturate(_SubpixelThreshold / (FLT_EPS + texel_vel_mag));

										// tap distance in texels: _GatherBase plus up to _GatherSubpixelMotion
										float k_min_max_support = _GatherBase + _GatherSubpixelMotion * k_subpixel_motion;


										// four diagonal taps at +/- k_min_max_support texels from uv
										float2 ss_offset01 = k_min_max_support * float2(-_MainTex_TexelSize.x, _MainTex_TexelSize.y);

										float2 ss_offset11 = k_min_max_support * float2(_MainTex_TexelSize.x, _MainTex_TexelSize.y);

										float4 c00 = sample_color(_MainTex, uv - ss_offset11);

										float4 c10 = sample_color(_MainTex, uv - ss_offset01);

										float4 c01 = sample_color(_MainTex, uv + ss_offset01);

										float4 c11 = sample_color(_MainTex, uv + ss_offset11);


										float4 cmin = min(c00, min(c10, min(c01, c11)));

										float4 cmax = max(c00, max(c10, max(c01, c11)));


										#if USE_YCOCG || USE_CLIPPING

											float4 cavg = (c00 + c10 + c01 + c11) / 4.0;

										#endif


									#else

										#error "missing keyword MINMAX_..."

									#endif


										// shrink chroma min-max

									#if USE_YCOCG

										// chroma box: half-width is 1/8 of the luma (r channel) range, centred on texel0's chroma
										float2 chroma_extent = 0.25 * 0.5 * (cmax.r - cmin.r);

										float2 chroma_center = texel0.gb;

										cmin.yz = chroma_center - chroma_extent;

										cmax.yz = chroma_center + chroma_extent;

										cavg.yz = chroma_center;

									#endif


										// clamp to neighbourhood of current sample

									#if USE_CLIPPING

										// cavg is clamped into the box before being passed as clip_aabb's 'p'
										texel1 = clip_aabb(cmin.xyz, cmax.xyz, clamp(cavg, cmin, cmax), texel1);

									#else

										texel1 = clamp(texel1, cmin, cmax);

									#endif


										// feedback weight from unbiased luminance diff (t.lottes)

									#if USE_YCOCG

										// in YCoCg the first channel already holds luma
										float lum0 = texel0.r;

										float lum1 = texel1.r;

									#else

										float lum0 = Luminance(texel0.rgb);

										float lum1 = Luminance(texel1.rgb);

									#endif

										// difference relative to the brighter sample; the 0.2 floor bounds the denominator
										float unbiased_diff = abs(lum0 - lum1) / max(lum0, max(lum1, 0.2));

										float unbiased_weight = 1.0 - unbiased_diff;

										float unbiased_weight_sqr = unbiased_weight * unbiased_weight;

										// similar luminance -> weight near _FeedbackMax, large difference -> near _FeedbackMin
										float k_feedback = lerp(_FeedbackMin, _FeedbackMax, unbiased_weight_sqr);


										// output

										return lerp(texel0, texel1, k_feedback);

									}


									// Fragment outputs for two render targets: 'buffer' receives the resolved
									// temporal colour, 'screen' the same colour optionally blended with motion blur.
									struct f2rt

									{

										fixed4 buffer : SV_Target0;

										fixed4 screen : SV_Target1;

									};


									// Fragment stage. Reads velocity (and a distance value) for the fragment,
									// runs temporal_reprojection, optionally mixes in a motion-blurred colour,
									// and writes the saturated results to both targets of f2rt.
									f2rt frag(v2f IN)

									{

										f2rt OUT;


										// uv used for the velocity/depth lookups only; temporal_reprojection below gets IN.ss_txc
									#if UNJITTER_REPROJECTION

										float2 uv = IN.ss_txc - _JitterUV.xy;

									#else

										float2 uv = IN.ss_txc;

									#endif


									#if USE_DILATION

										//--- 3x3 norm (sucks)

										//float2 ss_vel = sample_velocity_dilated(_VelocityBuffer, uv, 1);

										//float vs_dist = depth_sample_linear(uv);


										//--- 5 tap nearest (decent)

										//float3 c_frag = find_closest_fragment_5tap(uv);

										//float2 ss_vel = tex2D(_VelocityBuffer, c_frag.xy).xy;

										//float vs_dist = depth_resolve_linear(c_frag.z);


										//--- 3x3 nearest (good)

										// find_closest_fragment_3x3 / depth_resolve_linear are not defined in this file
										// (presumably IncDepth.cginc); c_frag.xy is used as a uv and c_frag.z as a depth value
										float3 c_frag = find_closest_fragment_3x3(uv);

										float2 ss_vel = tex2D(_VelocityBuffer, c_frag.xy).xy;

										float vs_dist = depth_resolve_linear(c_frag.z);

									#else

										float2 ss_vel = tex2D(_VelocityBuffer, uv).xy;

										float vs_dist = depth_sample_linear(uv);

									#endif


										// temporal resolve

										float4 color_temporal = temporal_reprojection(IN.ss_txc, ss_vel, vs_dist);


										// prepare outputs

										float4 to_buffer = resolve_color(color_temporal);


									#if USE_MOTION_BLUR

										// from here on ss_vel is the motion-blur velocity, scaled by _MotionScale
										#if USE_MOTION_BLUR_NEIGHBORMAX

											ss_vel = _MotionScale * tex2D(_VelocityNeighborMax, IN.ss_txc).xy;

										#else

											ss_vel = _MotionScale * ss_vel;

										#endif


										// trust in the temporal colour: 1 up to vel_trust_full, 0 from vel_trust_none,
										// linear in between (vel_mag is the velocity scaled by _MainTex_TexelSize.zw)
										float vel_mag = length(ss_vel * _MainTex_TexelSize.zw);

										const float vel_trust_full = 2.0;

										const float vel_trust_none = 15.0;

										const float vel_trust_span = vel_trust_none - vel_trust_full;

										float trust = 1.0 - clamp(vel_mag - vel_trust_full, 0.0, vel_trust_span) / vel_trust_span;


										#if UNJITTER_COLORSAMPLES

											float4 color_motion = sample_color_motion(_MainTex, IN.ss_txc - _JitterUV.xy, ss_vel);

										#else

											float4 color_motion = sample_color_motion(_MainTex, IN.ss_txc, ss_vel);

										#endif


										// blend happens before resolve_color, i.e. in the colour space of sample_color
										float4 to_screen = resolve_color(lerp(color_motion, color_temporal, trust));

									#else

										float4 to_screen = resolve_color(color_temporal);

									#endif


										//// NOTE: velocity debug

										//to_screen.g += 100.0 * length(ss_vel);

										//to_screen = float4(100.0 * abs(ss_vel), 0.0, 0.0);


										// add noise

										// NOTE(review): noise4 is computed but currently unused -- both additions below are commented out
										float4 noise4 = PDsrand4(IN.ss_txc + _SinTime.x + 0.6959174) / 510.0;

										OUT.buffer = saturate(to_buffer /*+ noise4*/);

										//OUT.screen = saturate(to_screen + noise4);

										OUT.screen = saturate(to_screen /*+ noise4*/)/* * float4(1,.2,0,1)*/;

										//OUT.screen = float4(vs_dist, vs_dist, vs_dist,1);

										// done

										return OUT;

									}


									//--- program end

									ENDCG


									// Single pass using the vert/frag entry points defined in the CGINCLUDE block above.
									SubShader

									{

										// render state for the pass: depth test always passes, no culling, no depth writes, fog off
										ZTest Always Cull Off ZWrite Off

										Fog { Mode off }


										Pass

										{

											CGPROGRAM


											#pragma vertex vert

											#pragma fragment frag


											ENDCG

										}

									}


									Fallback off

								}