Files

63 lines
2.1 KiB
GLSL

/*
* Copyright (c) 2021-2022 Wu Jianhua <jianhua.wu@intel.com>
* Copyright (c) 2026 Lynne <dev@lynne.ee>
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#pragma shader_stage(compute)
#extension GL_EXT_shader_image_load_formatted : require
#extension GL_EXT_scalar_block_layout : require
#extension GL_EXT_nonuniform_qualifier : require
/* Workgroup dimensions are supplied through specialization constants
 * 253 (x), 254 (y) and 255 (z) rather than being fixed in the source. */
layout (local_size_x_id = 253, local_size_y_id = 254, local_size_z_id = 255) in;
/* Unsized arrays of source and destination images; main() indexes both
 * with P_IDX, i.e. one array element per gl_WorkGroupID.z value. */
layout (set = 0, binding = 0) uniform readonly image2D input_img[];
layout (set = 0, binding = 1) uniform writeonly image2D output_img[];
/* Filter weights. main() applies kernel[0] to the centre pixel and
 * kernel[i] to both pixels i steps away, so only one side of the
 * symmetric filter is stored. The tap count is kernel.length(). */
layout (set = 1, binding = 0, scalar) readonly buffer kernel_buf {
float kernel[];
};
layout (push_constant, scalar) uniform pushConstants {
/* Bitmask tested in main(): bit N must be set for the workgroups with
 * gl_WorkGroupID.z == N to do any work. */
int planes;
};
/* Image array index for the current workgroup. */
#define P_IDX nonuniformEXT(gl_WorkGroupID.z)
/*
 * One pass of a symmetric 1-D filter: each invocation produces one output
 * pixel of the image selected by gl_WorkGroupID.z.
 *
 * - Images whose bit is not set in the `planes` push constant are skipped.
 * - Invocations that fall outside the image return without writing.
 * - The filter runs along X when the workgroup is wider than it is tall,
 *   and along Y otherwise.
 * - kernel[0] weights the centre pixel; kernel[i] weights the two pixels
 *   i steps away on either side of it.
 * - Taps that would fall outside the image are clamped to the nearest edge
 *   pixel, so no out-of-bounds imageLoad() is ever issued.
 */
void main()
{
    if ((planes & (1 << gl_WorkGroupID.z)) == 0)
        return;

    ivec2 pos  = ivec2(gl_GlobalInvocationID.xy);
    ivec2 size = imageSize(input_img[P_IDX]);
    if (any(greaterThanEqual(pos, size)))
        return;

    /* Loop-invariant: unit step along the filtered axis and the last valid
     * texel coordinate. */
    ivec2 dir  = gl_WorkGroupSize.x > gl_WorkGroupSize.y ? ivec2(1, 0) :
                                                           ivec2(0, 1);
    ivec2 last = size - ivec2(1);

    vec4 sum = imageLoad(input_img[P_IDX], pos) * kernel[0];
    for (int i = 1; i < kernel.length(); i++) {
        /* Out-of-range image loads yield undefined (or zero/border) values
         * depending on the device's robustness settings, which would corrupt
         * or darken pixels near the edges. Replicate the edge pixel instead
         * so the applied weights always sum to the same total. */
        ivec2 fwd = min(pos + dir * i, last);
        ivec2 bwd = max(pos - dir * i, ivec2(0));

        sum += imageLoad(input_img[P_IDX], fwd) * kernel[i];
        sum += imageLoad(input_img[P_IDX], bwd) * kernel[i];
    }

    imageStore(output_img[P_IDX], pos, sum);
}