mirror of
https://git.ffmpeg.org/ffmpeg.git
synced 2026-03-14 00:07:50 +01:00
259 lines
7.8 KiB
GLSL
259 lines
7.8 KiB
GLSL
/*
|
|
* FFv1 codec
|
|
*
|
|
* Copyright (c) 2024 Lynne <dev@lynne.ee>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#ifndef VULKAN_FFV1_COMMON_H
|
|
#define VULKAN_FFV1_COMMON_H
|
|
|
|
#ifdef GOLOMB
|
|
#include "ffv1_vlc.glsl"
|
|
#endif
|
|
|
|
/* Dimensions of the quant_table[][][] array declared further down. */
#define MAX_QUANT_TABLES     8   /* outermost dimension: number of table sets   */
#define MAX_CONTEXT_INPUTS   5   /* middle dimension: tables per set            */
#define MAX_QUANT_TABLE_SIZE 256 /* innermost dimension: entries per table      */

/* Mask applied to sample differences before they index a table. */
#define MAX_QUANT_TABLE_MASK (MAX_QUANT_TABLE_SIZE - 1)
|
|
|
|
/*
 * Specialization constants. The values written here are only the defaults;
 * each one can be overridden through its constant_id at pipeline creation.
 */

/* General coder configuration.
 * - rgb_linecache feeds RGB_LBUF/LADDR and get_pred() when RGB is defined.
 * - version is compared against 4 in slice_coord().
 * - has_extend_lookup gates the extra context inputs in get_pred(). */
layout (constant_id =  0) const int  rgb_linecache     = 2;
layout (constant_id =  1) const bool has_crc           = false;
layout (constant_id =  2) const int  version           = 0;
layout (constant_id =  3) const int  quant_table_count = 0;
layout (constant_id =  4) const bool has_extend_lookup = false;

/* Format-related parameters (not referenced by the code in this file). */
layout (constant_id =  5) const int  rct_offset        = 0;
layout (constant_id =  6) const int  colorspace        = 0;
layout (constant_id =  7) const bool transparency      = false;
layout (constant_id =  8) const bool planar_rgb        = false;
layout (constant_id =  9) const int  codec_planes      = 0;
layout (constant_id = 10) const int  color_planes      = 0;
layout (constant_id = 11) const int  planes            = 0;
layout (constant_id = 12) const int  bits              = 0;

/* Chroma shifts, also exposed as a single (x, y) vector. */
layout (constant_id = 13) const int  chroma_shift_x    = 0;
layout (constant_id = 14) const int  chroma_shift_y    = 0;
const ivec2 chroma_shift = ivec2(chroma_shift_x, chroma_shift_y);

/* Encoder-only */
layout (constant_id = 15) const bool force_pcm         = false;
layout (constant_id = 16) const bool rct_search        = false;
layout (constant_id = 17) const uint context_model     = 0;
|
|
|
|
/*
 * Push constants shared by the FFv1 shaders. The block uses the scalar
 * layout, so the order and types of the members below define its memory
 * layout and must not be rearranged.
 */
layout (push_constant, scalar) uniform pushConstants {
    u8buf    slice_data;

    /* One entry per quantization table set. */
    bool     extend_lookup[MAX_QUANT_TABLES];
    uint16_t context_count[MAX_QUANT_TABLES];

    ivec4    fmt_lut;
    u16vec2  img_size;

    uint     plane_state_size;
    bool     key_frame;
    uint32_t crcref;
    int      micro_version;   /* checked together with `version` in slice_coord() */

    /* Encoder-only */
    ivec2    sar;
    int      pic_mode;
    uint     slice_size_max;
};
|
|
|
|
#include "rangecoder.glsl"
|
|
|
|
/*
 * Sample types used by the prediction code: 32-bit integers when RGB is
 * defined, 16-bit integers otherwise. VTYPE2/VTYPE3 are the matching
 * two- and three-component vector types.
 */
#ifdef RGB
#define TYPE   int32_t
#define VTYPE2 i32vec2
#define VTYPE3 i32vec3
#else
#define TYPE   int16_t
#define VTYPE2 i16vec2
#define VTYPE3 i16vec3
#endif
|
|
|
|
/*
 * Per-slice state, stored as an array in the slice_ctx_buf storage buffer.
 * That buffer uses the scalar layout, so member order is part of the
 * memory layout and must be kept as-is.
 */
struct SliceContext {
    RangeCoder c;                 /* coder state; type comes from rangecoder.glsl */

    ivec2      slice_dim;
    ivec2      slice_pos;
    ivec2      slice_rct_coef;
    u8vec3     quant_table_idx;

    uint       slice_coding_mode;
    bool       slice_reset_contexts;
};
|
|
|
|
/*
 * Default memory qualifier for the slice context buffer. A shader may define
 * SB_QUALI itself before including this file; otherwise the buffer is
 * readonly when ENCODE or DECODE is defined and unqualified in every other
 * shader.
 */
#ifndef SB_QUALI
#if !defined(ENCODE) && !defined(DECODE)
#define SB_QUALI
#else
#define SB_QUALI readonly
#endif
#endif
|
|
|
|
/* Runtime-sized array of slice contexts (set 1, binding 0), qualified by SB_QUALI. */
layout (set = 1, binding = 0, scalar) SB_QUALI buffer slice_ctx_buf {
    SliceContext slice_ctx[];
};
|
|
|
|
/*
 * Maps slice index `sx` (out of `num_h_slices`) to a coordinate along a
 * dimension of length `width`.
 *
 * For versions below 4, and for version 4 with micro_version below 3, the
 * coordinate is simply width * sx / num_h_slices.
 *
 * Otherwise the coordinate is rounded to the nearest multiple of
 * (1 << chroma_shift) of the aligned width; a result equal to the aligned
 * width is replaced by the unaligned `width`.
 *
 * Note: the `chroma_shift` parameter shadows the file-level ivec2 constant of
 * the same name. align() is defined outside this file.
 */
uint slice_coord(uint width, uint sx, uint num_h_slices, uint chroma_shift)
{
    uint step = 1 << chroma_shift;
    uint aligned_width = align(width, step);

    bool legacy_layout = (version < 4) ||
                         ((version == 4) && (micro_version < 3));
    if (legacy_layout)
        return width * sx / num_h_slices;

    /* (2*a + b) / (2*b) rounds a/b to the nearest integer. */
    uint pos = (2 * aligned_width * sx + num_h_slices * step) /
               (2 * num_h_slices * step) * step;

    return (pos == aligned_width) ? width : pos;
}
|
|
|
|
#if defined(ENCODE) || defined(DECODE)
|
|
|
|
/*
 * Quantization tables (set 0, binding 1), indexed as
 * quant_table[table set][context input][masked sample difference].
 */
layout (set = 0, binding = 1, scalar) readonly uniform quant_buf {
    int16_t quant_table[MAX_QUANT_TABLES][MAX_CONTEXT_INPUTS][MAX_QUANT_TABLE_SIZE];
};
|
|
|
|
/*
 * Sample prediction from three neighbours.
 *
 * L   - neighbour at horizontal offset -1 on the current row
 * top - neighbours on the row above, at horizontal offsets { -1, 0 }
 *
 * Returns mid_pred() of L, top[1] and the gradient L + top[1] - top[0].
 * mid_pred() is defined outside this file (presumably a median of three).
 */
int predict(int L, ivec2 top)
{
    int gradient = L + top[1] - top[0];
    return mid_pred(L, gradient, top[1]);
}
|
|
|
|
/*
 * 41-entry lookup table; it is not referenced by the code in this file.
 * NOTE(review): presumably the run-length exponent table of the Golomb run
 * mode - confirm against the shaders that include this header.
 */
const uint32_t log2_run[41] = {
     0,  0,  0,  0,  1,  1,  1,  1,  2,  2,  2,  2,  3,  3,  3,  3,
     4,  4,  5,  5,  6,  6,  7,  7,
     8,  9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24,
};
|
|
|
|
/*
 * Workgroup-shared pair of recent samples. linecache_next() moves element 1
 * into element 0 and stores the new sample in element 1; get_pred() reads
 * element 1 as the current neighbour and element 0 as the one before it.
 */
shared VTYPE2 linecache;
|
|
|
|
#ifdef RGB
|
|
/* Row mask for RGB addressing, derived from the rgb_linecache constant. */
#define RGB_LBUF (rgb_linecache - 1)

/* Masks the row of offset `p` with RGB_LBUF; the column is left untouched.
 * `p` is expanded twice, so it must be free of side effects. */
#define LADDR(p) (ivec2((p).x, ((p).y & RGB_LBUF)))
|
|
|
|
/*
 * RGB variant: computes the context and the prediction for the sample at
 * offset `off` inside the region that starts at `sp` in image `pred`.
 *
 * pred            - image the neighbouring samples are loaded from
 * sp              - base position added to every (row-masked) offset
 * off             - offset of the current sample
 * comp            - component of the loaded texel to use
 * sw              - width used to clamp the top-right neighbour
 * quant_table_idx - table set to use in quant_table
 * extend_lookup   - enables the two extra context inputs (only honoured when
 *                   has_extend_lookup is set); shadows the push constant of
 *                   the same name
 *
 * Returns ivec2(context, prediction).
 *
 * Unlike the non-RGB variant there are no explicit border checks here. The
 * original author's reasoning: the RGB buffer is zeroed, and for the very
 * first sample ivec2(-1, 0) + ivec2(1, -1) == ivec2(0, -1), i.e. the previous
 * row at offset 0 of the same slice, which therefore reads as zero.
 */
ivec2 get_pred(readonly uimage2D pred, ivec2 sp, ivec2 off,
               uint comp, int sw, uint8_t quant_table_idx, bool extend_lookup)
{
    /* Top-left neighbour; in the first column the offset is first moved by
     * (1, -1), so the load ends up one row further up in column 0. */
    ivec2 tl_off = off;
    if (expectEXT(off.x == 0, false))
        tl_off = off + ivec2(1, -1);
    tl_off += ivec2(-1, -1);

    /* Top and top-right neighbours; the horizontal step of the latter is
     * limited to min(1, sw - off.x - 1). */
    ivec2 t_off  = off + ivec2(0, -1);
    int   tr_dx  = min(1, sw - off.x - 1);
    ivec2 tr_off = off + ivec2(tr_dx, -1);

    TYPE tl = TYPE(imageLoad(pred, sp + LADDR(tl_off))[comp]);
    TYPE t  = TYPE(imageLoad(pred, sp + LADDR(t_off))[comp]);
    TYPE tr = TYPE(imageLoad(pred, sp + LADDR(tr_off))[comp]);

    /* Most recent entry of the line cache. */
    TYPE left = linecache[1];

    int ctx = quant_table[quant_table_idx][0][(left - tl) & MAX_QUANT_TABLE_MASK] +
              quant_table[quant_table_idx][1][(tl - t) & MAX_QUANT_TABLE_MASK] +
              quant_table[quant_table_idx][2][(t - tr) & MAX_QUANT_TABLE_MASK];

    if (has_extend_lookup && extend_lookup) {
        TYPE left2 = linecache[0];
        ctx += quant_table[quant_table_idx][3][(left2 - left) & MAX_QUANT_TABLE_MASK];

        /* top-2 became current upon swap when rgb_linecache == 2, so the
         * offset is only moved up by two rows for other cache sizes. */
        ivec2 tt_off = (rgb_linecache != 2) ? off + ivec2(0, -2) : off;

        TYPE tt = TYPE(imageLoad(pred, sp + LADDR(tt_off))[comp]);
        ctx += quant_table[quant_table_idx][4][(tt - t) & MAX_QUANT_TABLE_MASK];
    }

    /* context, prediction */
    return ivec2(ctx, predict(left, VTYPE2(tl, t)));
}
|
|
|
|
#else
|
|
|
|
/* Without RGB, offsets are used unchanged: no row masking is applied. */
#define LADDR(p) (p)
|
|
|
|
/*
 * Non-RGB variant: computes the context and the prediction for the sample at
 * offset `off` inside the region that starts at `sp` in image `pred`.
 *
 * pred            - image the neighbouring samples are loaded from
 * sp              - base position of the region
 * off             - offset of the current sample inside the region
 * comp            - component of the loaded texel to use
 * sw              - width used to clamp the top-right neighbour
 * quant_table_idx - table set to use in quant_table
 * extend_lookup   - enables the two extra context inputs (only honoured when
 *                   has_extend_lookup is set); shadows the push constant of
 *                   the same name
 *
 * Returns ivec2(context, prediction). Neighbours that would lie above the
 * first row of the region are taken as zero.
 */
ivec2 get_pred(readonly uimage2D pred, ivec2 sp, ivec2 off,
               uint comp, int sw, uint8_t quant_table_idx, bool extend_lookup)
{
    ivec2 pos = sp + off;

    TYPE tl = TYPE(0);
    TYPE t  = TYPE(0);
    TYPE tr = TYPE(0);

    if (off.y > 0) {
        t  = TYPE(imageLoad(pred, pos + ivec2(0, -1))[comp]);
        tr = TYPE(imageLoad(pred, pos + ivec2(min(1, sw - off.x - 1), -1))[comp]);

        /* The top-left neighbour stays zero for the first sample of row 1. */
        if (off != ivec2(0, 1)) {
            /* In the first column, (-1, -1) + (1, -1) selects column 0 two
             * rows up instead of the sample left of the region. */
            ivec2 tl_step = (off.x == 0) ? ivec2(0, -2) : ivec2(-1, -1);
            tl = TYPE(imageLoad(pred, pos + tl_step)[comp]);
        }
    }

    /* Most recent entry of the line cache. */
    TYPE left = linecache[1];

    int ctx = quant_table[quant_table_idx][0][(left - tl) & MAX_QUANT_TABLE_MASK] +
              quant_table[quant_table_idx][1][(tl - t) & MAX_QUANT_TABLE_MASK] +
              quant_table[quant_table_idx][2][(t - tr) & MAX_QUANT_TABLE_MASK];

    if (has_extend_lookup && extend_lookup) {
        TYPE left2 = linecache[0];
        ctx += quant_table[quant_table_idx][3][(left2 - left) & MAX_QUANT_TABLE_MASK];

        /* Sample two rows up, zero while fewer than two rows precede us. */
        TYPE tt = (off.y > 1) ? TYPE(imageLoad(pred, pos + ivec2(0, -2))[comp])
                              : TYPE(0);
        ctx += quant_table[quant_table_idx][4][(tt - t) & MAX_QUANT_TABLE_MASK];
    }

    /* context, prediction */
    return ivec2(ctx, predict(left, VTYPE2(tl, t)));
}
|
|
|
|
#endif /* RGB */
|
|
|
|
/*
 * Initialises the shared line cache for row `y`.
 *
 * Invocation 0 clears linecache[0]. Invocation 1 sets linecache[1] to the
 * sample at column 0 of row y - 1 (read from `src` at `sp`, component
 * `comp`), or to zero when y is 0. All invocations then meet at a barrier.
 */
void linecache_load(readonly uimage2D src, ivec2 sp, int y, uint comp)
{
    uint lane = gl_LocalInvocationID.x;

    if (lane == 1) {
        linecache[1] = (y > 0)
                     ? TYPE(imageLoad(src, sp + LADDR(ivec2(0, y - 1)))[comp])
                     : TYPE(0);
    } else if (lane == 0) {
        linecache[0] = TYPE(0);
    }

    barrier();
}
|
|
|
|
/*
 * Advances the line cache by one sample: the previous newest entry moves to
 * element 0 and `cur` becomes the new element 1.
 */
void linecache_next(TYPE cur)
{
    linecache = VTYPE2(linecache[1], cur);
}
|
|
|
|
#endif /* ENCODE || DECODE */
|
|
|
|
#endif /* VULKAN_FFV1_COMMON_H */
|