slang-shaders/xbr/shaders/xbr-mlv4-multipass/xbr-mlv4-pass1.slang

335 lines
15 KiB
Plaintext

#version 450
/*
Hyllian's xBR MultiLevel4 Shader - Pass1
Copyright (C) 2011-2015 Hyllian - sergiogdb@gmail.com
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
layout(push_constant) uniform Push
{
vec4 SourceSize;
vec4 OriginalSize;
vec4 OutputSize;
uint FrameCount;
} params;
layout(std140, set = 0, binding = 0) uniform UBO
{
mat4 MVP;
} global;
#define round(X) floor((X)+0.5)
#define TEX(dx,dy) texture(Source, vTexCoord+vec2((dx),(dy))*t1).rgb
#define mul(a,b) (b*a)
const float cf2 = 2.0;
const float cf3 = 4.0;
const float cf4 = 4.0;
const vec4 eq_thresholdold = vec4(15.0, 15.0, 15.0, 15.0);
const vec4 eq_threshold = vec4( 2.0, 2.0, 2.0, 2.0);
const vec4 eq_threshold3 = vec4(25.0, 25.0, 25.0, 25.0);
const vec3 Yuv_weight = vec3(4.0, 1.0, 2.0);
const mat3 yuv = mat3(0.299, 0.587, 0.114, -0.169, -0.331, 0.499, 0.499, -0.418, -0.0813);
const mat3 yuvT = mat3(0.299, -0.169, 0.499, 0.587, -0.331, -0.418, 0.114, 0.499, -0.0813);
const vec4 maximo = vec4(255.0, 255.0, 255.0, 255.0);
vec4 df(vec4 A, vec4 B)
{
return vec4(abs(A-B));
}
bvec4 rd(vec4 A, vec4 B, vec4 C, vec4 D)
{
return (greaterThan(df(C,D)/(df(A,B)+0.000000001) , vec4(2.0)));
}
bvec4 id(vec4 A, vec4 B, vec4 C, vec4 D)
{
return greaterThan(df(C,D) , df(A,B));
}
vec4 remapTo01(vec4 v, vec4 high)
{
return (v/high);
}
bvec4 eq(vec4 A, vec4 B)
{
return lessThan(df(A, B) , eq_threshold);
}
bvec4 eq3(vec4 A, vec4 B)
{
return lessThan(df(A, B) , eq_threshold3);
}
vec4 weighted_distance(vec4 a, vec4 b, vec4 c, vec4 d, vec4 e, vec4 f, vec4 g, vec4 h)
{
return (df(a,b) + df(a,c) + df(d,e) + df(d,f) + 4.0*df(g,h));
}
bvec4 and(bvec4 A, bvec4 B)
{
return bvec4(A.x && B.x, A.y && B.y, A.z && B.z, A.w && B.w);
}
bvec4 or(bvec4 A, bvec4 B)
{
return bvec4(A.x || B.x, A.y || B.y, A.z || B.z, A.w || B.w);
}
#pragma stage vertex
layout(location = 0) in vec4 Position;
layout(location = 1) in vec2 TexCoord;
layout(location = 0) out vec2 vTexCoord;
layout(location = 1) out vec2 t1;
void main()
{
gl_Position = global.MVP * Position;
vTexCoord = TexCoord * 1.0004;
// A3 B3 C3
// A1 B1 C1
//A2 A0 A B C C4 C6
//D2 D0 D E F F4 F6
//G2 G0 G H I I4 I6
// G5 H5 I5
// G7 H7 I7
t1 = vec2(params.SourceSize.z, params.SourceSize.w); // F H
}
#pragma stage fragment
layout(location = 0) in vec2 vTexCoord;
layout(location = 1) in vec2 t1;
layout(location = 0) out vec4 FragColor;
layout(set = 0, binding = 2) uniform sampler2D Source;
void main()
{
bvec4 edr0, edr, edr_left, edr_up, edr3_left, edr3_up, edr4_left, edr4_up; // edr = edge detection rule
bvec4 interp_restriction_lv1, interp_restriction_lv2_left, interp_restriction_lv2_up;
bvec4 interp_restriction_lv3_left, interp_restriction_lv3_up;
bvec4 interp_restriction_lv4_left, interp_restriction_lv4_up;
vec3 A3 = TEX(-1,-3); vec3 B3 = TEX( 0,-3); vec3 C3 = TEX( 1,-3);
vec3 A1 = TEX(-1,-2); vec3 B1 = TEX( 0,-2); vec3 C1 = TEX( 1,-2);
vec3 A2 = TEX(-3,-1); vec3 A0 = TEX(-2,-1); vec3 A = TEX(-1,-1); vec3 B = TEX( 0,-1); vec3 C = TEX( 1,-1); vec3 C4 = TEX( 2,-1); vec3 C6 = TEX( 3,-1);
vec3 D2 = TEX(-3, 0); vec3 D0 = TEX(-2, 0); vec3 D = TEX(-1, 0); vec3 E = TEX( 0, 0); vec3 F = TEX( 1, 0); vec3 F4 = TEX( 2, 0); vec3 F6 = TEX( 3, 0);
vec3 G2 = TEX(-3, 1); vec3 G0 = TEX(-2, 1); vec3 G = TEX(-1, 1); vec3 H = TEX( 0, 1); vec3 I = TEX( 1, 1); vec3 I4 = TEX( 2, 1); vec3 I6 = TEX( 3, 1);
vec3 G5 = TEX(-1, 2); vec3 H5 = TEX( 0, 2); vec3 I5 = TEX( 1, 2);
vec3 G7 = TEX(-1, 3); vec3 H7 = TEX( 0, 3); vec3 I7 = TEX( 1, 3);
mat4x3 bdhf = mul( mat4x3(B, D, H, F), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 b = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(C, A, G, I), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 c = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(E, E, E, E), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 e = mul( bdhf, Yuv_weight);
vec4 d = b.yzwx;
vec4 f = b.wxyz;
vec4 g = c.zwxy;
vec4 h = b.zwxy;
vec4 i = c.wxyz;
bdhf = mul( mat4x3(I4, C1, A0, G5), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 i4 = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(I5, C4, A1, G0), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 i5 = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(H5, F4, B1, D0), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 h5 = mul( bdhf, Yuv_weight);
vec4 f4 = h5.yzwx;
vec4 c1 = i4.yzwx;
vec4 g0 = i5.wxyz;
vec4 b1 = h5.zwxy;
vec4 d0 = h5.wxyz;
bdhf = mul( mat4x3(I6, C3, A2, G7), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 i6 = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(I7, C6, A3, G2), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 i7 = mul( bdhf, Yuv_weight);
bdhf = mul( mat4x3(H7, F6, B3, D2), yuvT );
bdhf = mat4x3(abs(bdhf[0]), abs(bdhf[1]), abs(bdhf[2]), abs(bdhf[3]));
vec4 h7 = mul( bdhf, Yuv_weight);
vec4 f6 = h7.yzwx;
vec4 c3 = i6.yzwx;
vec4 g2 = i7.wxyz;
vec4 b3 = h7.zwxy;
vec4 d2 = h7.wxyz;
//groan, gotta separate these into their components???
interp_restriction_lv1.x = !(e.x==f.x) && !(e.x==h.x);
interp_restriction_lv1.y = !(e.y==f.y) && !(e.y==h.y);
interp_restriction_lv1.z = !(e.z==f.z) && !(e.z==h.z);
interp_restriction_lv1.w = !(e.w==f.w) && !(e.w==h.w);
interp_restriction_lv2_left.x = (e.x!=g.x && d.x!=g.x && (eq(e, d).x || eq(h, g).x));
interp_restriction_lv2_left.y = (e.y!=g.y && d.y!=g.y && (eq(e, d).y || eq(h, g).y));
interp_restriction_lv2_left.z = (e.z!=g.z && d.z!=g.z && (eq(e, d).z || eq(h, g).z));
interp_restriction_lv2_left.w = (e.w!=g.w && d.w!=g.w && (eq(e, d).w || eq(h, g).w));
interp_restriction_lv2_up.x = (e.x!=c.x && b.x!=c.x && (eq(e, b).x || eq(f, c).x));
interp_restriction_lv2_up.y = (e.y!=c.y && b.y!=c.y && (eq(e, b).y || eq(f, c).y));
interp_restriction_lv2_up.z = (e.z!=c.z && b.z!=c.z && (eq(e, b).z || eq(f, c).z));
interp_restriction_lv2_up.w = (e.w!=c.w && b.w!=c.w && (eq(e, b).w || eq(f, c).w));
interp_restriction_lv3_left.x = (e.x!=g0.x && d0.x!=g0.x && (eq(d,d0).x || eq(g,g0).x));
interp_restriction_lv3_left.y = (e.y!=g0.y && d0.y!=g0.y && (eq(d,d0).y || eq(g,g0).y));
interp_restriction_lv3_left.z = (e.z!=g0.z && d0.z!=g0.z && (eq(d,d0).z || eq(g,g0).z));
interp_restriction_lv3_left.w = (e.w!=g0.w && d0.w!=g0.w && (eq(d,d0).w || eq(g,g0).w));
interp_restriction_lv3_up.x = (e.x!=c1.x && b1.x!=c1.x && (eq(b,b1).x || eq(c,c1).x));
interp_restriction_lv3_up.y = (e.y!=c1.y && b1.y!=c1.y && (eq(b,b1).y || eq(c,c1).y));
interp_restriction_lv3_up.z = (e.z!=c1.z && b1.z!=c1.z && (eq(b,b1).z || eq(c,c1).z));
interp_restriction_lv3_up.w = (e.w!=c1.w && b1.w!=c1.w && (eq(b,b1).w || eq(c,c1).w));
interp_restriction_lv4_left.x = (e.x!=g2.x && d2.x!=g2.x && (eq(d0,d2).x || eq(g0,g2).x));
interp_restriction_lv4_left.y = (e.y!=g2.y && d2.y!=g2.y && (eq(d0,d2).y || eq(g0,g2).y));
interp_restriction_lv4_left.z = (e.z!=g2.z && d2.z!=g2.z && (eq(d0,d2).z || eq(g0,g2).z));
interp_restriction_lv4_left.w = (e.w!=g2.w && d2.w!=g2.w && (eq(d0,d2).w || eq(g0,g2).w));
interp_restriction_lv4_up.x = (e.x!=c3.x && b3.x!=c3.x && (eq(b1,b3).x || eq(c1,c3).x));
interp_restriction_lv4_up.y = (e.y!=c3.y && b3.y!=c3.y && (eq(b1,b3).y || eq(c1,c3).y));
interp_restriction_lv4_up.z = (e.z!=c3.z && b3.z!=c3.z && (eq(b1,b3).z || eq(c1,c3).z));
interp_restriction_lv4_up.w = (e.w!=c3.w && b3.w!=c3.w && (eq(b1,b3).w || eq(c1,c3).w));
vec4 wd1 = weighted_distance( e, c, g, i, h5, f4, h, f);
vec4 wd2 = weighted_distance( h, d, i5, f, i4, b, e, i);
edr0.x = (wd1.x <= wd2.x) && interp_restriction_lv1.x;
edr0.y = (wd1.y <= wd2.y) && interp_restriction_lv1.y;
edr0.z = (wd1.z <= wd2.z) && interp_restriction_lv1.z;
edr0.w = (wd1.w <= wd2.w) && interp_restriction_lv1.w;
edr.x = (wd1.x < wd2.x) && interp_restriction_lv1.x && ( !eq(f,b).x && !id(f,c,f,b).x || !eq(h,d).x && !id(h,g,h,d).x || eq(e,g).x || eq(e,c).x);
edr.y = (wd1.y < wd2.y) && interp_restriction_lv1.y && ( !eq(f,b).y && !id(f,c,f,b).y || !eq(h,d).y && !id(h,g,h,d).y || eq(e,g).y || eq(e,c).y);
edr.z = (wd1.z < wd2.z) && interp_restriction_lv1.z && ( !eq(f,b).z && !id(f,c,f,b).z || !eq(h,d).z && !id(h,g,h,d).z || eq(e,g).z || eq(e,c).z);
edr.w = (wd1.w < wd2.w) && interp_restriction_lv1.w && ( !eq(f,b).w && !id(f,c,f,b).w || !eq(h,d).w && !id(h,g,h,d).w || eq(e,g).w || eq(e,c).w);
edr_left.x = ((cf2*df(f,g).x) <= df(h,c).x) && interp_restriction_lv2_left.x && edr.x;
edr_left.y = ((cf2*df(f,g).y) <= df(h,c).y) && interp_restriction_lv2_left.y && edr.y;
edr_left.z = ((cf2*df(f,g).z) <= df(h,c).z) && interp_restriction_lv2_left.z && edr.z;
edr_left.w = ((cf2*df(f,g).w) <= df(h,c).w) && interp_restriction_lv2_left.w && edr.w;
edr_up.x = (df(f,g).x >= (cf2*df(h,c).x)) && interp_restriction_lv2_up.x && edr.x;
edr_up.y = (df(f,g).y >= (cf2*df(h,c).y)) && interp_restriction_lv2_up.y && edr.y;
edr_up.z = (df(f,g).z >= (cf2*df(h,c).z)) && interp_restriction_lv2_up.z && edr.z;
edr_up.w = (df(f,g).w >= (cf2*df(h,c).w)) && interp_restriction_lv2_up.w && edr.w;
edr3_left.x = ((cf3*df(f,g0).x) <= df(h,c1).x) && interp_restriction_lv3_left.x && edr_left.x;
edr3_left.y = ((cf3*df(f,g0).y) <= df(h,c1).y) && interp_restriction_lv3_left.y && edr_left.y;
edr3_left.z = ((cf3*df(f,g0).z) <= df(h,c1).z) && interp_restriction_lv3_left.z && edr_left.z;
edr3_left.w = ((cf3*df(f,g0).w) <= df(h,c1).w) && interp_restriction_lv3_left.w && edr_left.w;
edr3_up.x = (df(f,g0).x >= (cf3*df(h,c1).x)) && interp_restriction_lv3_up.x && edr_up.x;
edr3_up.y = (df(f,g0).y >= (cf3*df(h,c1).y)) && interp_restriction_lv3_up.y && edr_up.y;
edr3_up.z = (df(f,g0).z >= (cf3*df(h,c1).z)) && interp_restriction_lv3_up.z && edr_up.z;
edr3_up.w = (df(f,g0).w >= (cf3*df(h,c1).w)) && interp_restriction_lv3_up.w && edr_up.w;
edr4_left.x = ((cf4*df(f,g2).x) <= df(h,c3).x) && interp_restriction_lv4_left.x && edr3_left.x;
edr4_left.y = ((cf4*df(f,g2).y) <= df(h,c3).y) && interp_restriction_lv4_left.y && edr3_left.y;
edr4_left.z = ((cf4*df(f,g2).z) <= df(h,c3).z) && interp_restriction_lv4_left.z && edr3_left.z;
edr4_left.w = ((cf4*df(f,g2).w) <= df(h,c3).w) && interp_restriction_lv4_left.w && edr3_left.w;
edr4_up.x = (df(f,g2).x >= (cf4*df(h,c3).x)) && interp_restriction_lv4_up.x && edr3_up.x;
edr4_up.y = (df(f,g2).y >= (cf4*df(h,c3).y)) && interp_restriction_lv4_up.y && edr3_up.y;
edr4_up.z = (df(f,g2).z >= (cf4*df(h,c3).z)) && interp_restriction_lv4_up.z && edr3_up.z;
edr4_up.w = (df(f,g2).w >= (cf4*df(h,c3).w)) && interp_restriction_lv4_up.w && edr3_up.w;
/* condensed
interp_restriction_lv2_left = or(and(and(notEqual(e,g) , notEqual(d,g)) , eq(e, d)) , eq(h, g));
interp_restriction_lv2_up = or(and(and(notEqual(e,c) , notEqual(b,c)) , eq(e, b)) , eq(f, c));
interp_restriction_lv3_left = or(and(and(notEqual(e,g0) , notEqual(d0,g0)) , eq(d,d0)) , eq(g,g0));
interp_restriction_lv3_up = or(and(and(notEqual(e,c1) , notEqual(b1,c1)) , eq(b,b1)) , eq(c,c1));
interp_restriction_lv4_left = or(and(and(notEqual(e,g2) , notEqual(d2,g2)) , eq(d0,d2)) , eq(g0,g2));
interp_restriction_lv4_up = or(and(and(notEqual(e,c3) , notEqual(b3,c3)) , eq(b1,b3)) , eq(c1,c3));
vec4 wd1 = weighted_distance( e, c, g, i, h5, f4, h, f);
vec4 wd2 = weighted_distance( h, d, i5, f, i4, b, e, i);
bvec4 comp1 = and(not(eq(h,d)) , not(id(h,g,h,d)));
bvec4 comp2 = and(not(eq(f,b)) , not(id(f,c,f,b)));
edr0 = and(lessThanEqual(wd1 , wd2) , interp_restriction_lv1);
edr = and(lessThan(wd1 , wd2) , and(interp_restriction_lv1 , ( or(comp2 , or(comp1 , or(eq(e,g) , eq(e,c)))) ) ));
edr_left = and(lessThanEqual((cf2*df(f,g)) , df(h,c)) , and(interp_restriction_lv2_left , edr));
edr_up = and(greaterThanEqual(df(f,g) , (cf2*df(h,c))) , and(interp_restriction_lv2_up , edr));
edr3_left = and(lessThanEqual((cf3*df(f,g0)) , df(h,c1)) , and(interp_restriction_lv3_left , edr_left));
edr3_up = and(greaterThanEqual(df(f,g0) , (cf3*df(h,c1))) , and(interp_restriction_lv3_up , edr_up));
edr4_left = and(lessThanEqual((cf4*df(f,g2)) , df(h,c3)) , and(interp_restriction_lv4_left , edr3_left));
edr4_up = and(greaterThanEqual(df(f,g2) , (cf4*df(h,c3))) , and(interp_restriction_lv4_up , edr3_up));
*/
vec4 info;
info.x = (edr0.x == true) ? 1.0 : 0.0;
info.y = (edr0.y == true) ? 1.0 : 0.0;
info.z = (edr0.z == true) ? 1.0 : 0.0;
info.w = (edr0.w == true) ? 1.0 : 0.0;
info.x = (edr.x == true) ? 2.0 : info.x;
info.y = (edr.y == true) ? 2.0 : info.y;
info.z = (edr.z == true) ? 2.0 : info.z;
info.w = (edr.w == true) ? 2.0 : info.w;
info.x = and(edr_up , not(edr_left)).x == true ? 3.0 : info.x;
info.y = and(edr_up , not(edr_left)).y == true ? 3.0 : info.y;
info.z = and(edr_up , not(edr_left)).z == true ? 3.0 : info.z;
info.w = and(edr_up , not(edr_left)).w == true ? 3.0 : info.w;
info.x = and(edr_left , not(edr_up)).x == true ? 4.0 : info.x;
info.y = and(edr_left , not(edr_up)).y == true ? 4.0 : info.y;
info.z = and(edr_left , not(edr_up)).z == true ? 4.0 : info.z;
info.w = and(edr_left , not(edr_up)).w == true ? 4.0 : info.w;
info.x = and(edr3_up , not(edr3_left)).x == true ? 5.0 : info.x;
info.y = and(edr3_up , not(edr3_left)).y == true ? 5.0 : info.y;
info.z = and(edr3_up , not(edr3_left)).z == true ? 5.0 : info.z;
info.w = and(edr3_up , not(edr3_left)).w == true ? 5.0 : info.w;
info.x = and(edr3_left , not(edr3_up)).x == true ? 6.0 : info.x;
info.y = and(edr3_left , not(edr3_up)).y == true ? 6.0 : info.y;
info.z = and(edr3_left , not(edr3_up)).z == true ? 6.0 : info.z;
info.w = and(edr3_left , not(edr3_up)).w == true ? 6.0 : info.w;
info.x = and(edr4_up , not(edr4_left)).x == true ? 7.0 : info.x;
info.y = and(edr4_up , not(edr4_left)).y == true ? 7.0 : info.y;
info.z = and(edr4_up , not(edr4_left)).z == true ? 7.0 : info.z;
info.w = and(edr4_up , not(edr4_left)).w == true ? 7.0 : info.w;
info.x = and(edr4_left , not(edr4_up)).x == true ? 8.0 : info.x;
info.y = and(edr4_left , not(edr4_up)).y == true ? 8.0 : info.y;
info.z = and(edr4_left , not(edr4_up)).z == true ? 8.0 : info.z;
info.w = and(edr4_left , not(edr4_up)).w == true ? 8.0 : info.w;
FragColor = vec4(remapTo01(info, maximo));
}