1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
|
#version 310 es
/*
 * Compute-shader interface for a two-input, mask-weighted blend.
 *
 * Every storage buffer below is an array of uvec2; main() unpacks each
 * 32-bit component with unpackUnorm4x8, so one array element carries
 * eight normalized 8-bit values.
 * NOTE(review): the Y / UV buffer naming suggests an NV12-style layout
 * (full-resolution luma plane + interleaved half-height chroma plane);
 * confirm against the host code that binds these buffers.
 */
/* Work-group size: 8 x 8 invocations. */
layout (local_size_x = 8, local_size_y = 8) in;
/* Input image 0, Y plane (read-only). */
layout (binding = 0) readonly buffer In0BufY {
uvec2 data[];
} in0_buf_y;
/* Input image 0, UV plane (read-only). */
layout (binding = 1) readonly buffer In0BufUV {
uvec2 data[];
} in0_buf_uv;
/* Input image 1, Y plane (read-only). */
layout (binding = 2) readonly buffer In1BufY {
uvec2 data[];
} in1_buf_y;
/* Input image 1, UV plane (read-only). */
layout (binding = 3) readonly buffer In1BufUV {
uvec2 data[];
} in1_buf_uv;
/* Blended output, Y plane (write-only). */
layout (binding = 4) writeonly buffer OutBufY {
uvec2 data[];
} out_buf_y;
/* Blended output, UV plane (write-only). */
layout (binding = 5) writeonly buffer OutBufUV {
uvec2 data[];
} out_buf_uv;
/*
 * Blend weights (read-only). main() indexes this buffer by column only,
 * so the same weights are applied to every row.
 */
layout (binding = 6) readonly buffer MaskBuf {
uvec2 data[];
} mask_buf;
/*
 * Push constants.
 * in_img_width is used by main() as the row stride of all image buffers,
 * counted in uvec2 elements (not in pixels), and as the upper bound for
 * the column index.
 */
layout (push_constant) uniform PushConsts {
uint in_img_width;
} prop;
/*
 * Blend two packed uvec2 elements component-wise.
 *
 * Each 32-bit word of src0/src1 is unpacked into four normalized values,
 * combined as (src0 - src1) * weight + src1, i.e. weight == 1 selects src0
 * and weight == 0 selects src1, clamped to [0, 1] and packed back.
 * weight_lo applies to the .x word, weight_hi to the .y word.
 */
uvec2 blend_words (uvec2 src0, uvec2 src1, vec4 weight_lo, vec4 weight_hi)
{
    vec4 a_lo = unpackUnorm4x8 (src0.x);
    vec4 a_hi = unpackUnorm4x8 (src0.y);
    vec4 b_lo = unpackUnorm4x8 (src1.x);
    vec4 b_hi = unpackUnorm4x8 (src1.y);

    vec4 res_lo = (a_lo - b_lo) * weight_lo + b_lo;
    vec4 res_hi = (a_hi - b_hi) * weight_hi + b_hi;
    res_lo = clamp (res_lo, 0.0f, 1.0f);
    res_hi = clamp (res_hi, 0.0f, 1.0f);

    return uvec2 (packUnorm4x8 (res_lo), packUnorm4x8 (res_hi));
}

/*
 * Per-invocation work: blend two vertically adjacent Y rows and one UV row
 * of the two inputs, weighted by the per-column mask.
 */
void main ()
{
    uint stride = prop.in_img_width;
    /* Keep the column inside the row; invocations past the last column
     * redo the last column's work. The row index is not bounds-checked
     * here. NOTE(review): presumably the dispatch height matches the
     * image exactly; confirm on the host side. */
    uint col = min (gl_GlobalInvocationID.x, stride - 1u);
    uint row = gl_GlobalInvocationID.y;

    /* The mask is addressed by column only: one set of weights per column. */
    uvec2 mask_words = mask_buf.data[col];
    vec4 weight_lo = unpackUnorm4x8 (mask_words.x);
    vec4 weight_hi = unpackUnorm4x8 (mask_words.y);

    /* Each invocation covers Y rows 2 * row and 2 * row + 1. */
    uint y_top = row * 2u * stride + col;
    out_buf_y.data[y_top] = blend_words (in0_buf_y.data[y_top],
                                         in1_buf_y.data[y_top],
                                         weight_lo, weight_hi);

    uint y_bottom = y_top + stride;
    out_buf_y.data[y_bottom] = blend_words (in0_buf_y.data[y_bottom],
                                            in1_buf_y.data[y_bottom],
                                            weight_lo, weight_hi);

    /* A single UV row per invocation. Components are weighted in pairs:
     * each even-position weight is reused for the following component.
     * NOTE(review): this looks like interleaved U/V sharing one weight;
     * confirm against the image format. */
    uint uv_pos = row * stride + col;
    out_buf_uv.data[uv_pos] = blend_words (in0_buf_uv.data[uv_pos],
                                           in1_buf_uv.data[uv_pos],
                                           weight_lo.xxzz, weight_hi.xxzz);
}
|