From 2e2e08a35b479c5a2049a0f7eaf20e00aa78e923 Mon Sep 17 00:00:00 2001 From: "Ronald S. Bultje" Date: Wed, 6 Apr 2016 14:08:21 -0400 Subject: lavfi: new colorspace conversion filter. The intent here is similar to colormatrix, but it's LGPLv2.1-or-later (instead of GPLv2.0) and supports gamma/chromaticity correction. --- libavfilter/Makefile | 1 + libavfilter/allfilters.c | 1 + libavfilter/colorspacedsp.c | 131 ++++ libavfilter/colorspacedsp.h | 51 ++ libavfilter/colorspacedsp_template.c | 214 ++++++ libavfilter/colorspacedsp_yuv2yuv_template.c | 98 +++ libavfilter/vf_colorspace.c | 1024 ++++++++++++++++++++++++++ 7 files changed, 1520 insertions(+) create mode 100644 libavfilter/colorspacedsp.c create mode 100644 libavfilter/colorspacedsp.h create mode 100644 libavfilter/colorspacedsp_template.c create mode 100644 libavfilter/colorspacedsp_yuv2yuv_template.c create mode 100644 libavfilter/vf_colorspace.c (limited to 'libavfilter') diff --git a/libavfilter/Makefile b/libavfilter/Makefile index 3a3de48821..91075142df 100644 --- a/libavfilter/Makefile +++ b/libavfilter/Makefile @@ -131,6 +131,7 @@ OBJS-$(CONFIG_COLORCHANNELMIXER_FILTER) += vf_colorchannelmixer.o OBJS-$(CONFIG_COLORKEY_FILTER) += vf_colorkey.o OBJS-$(CONFIG_COLORLEVELS_FILTER) += vf_colorlevels.o OBJS-$(CONFIG_COLORMATRIX_FILTER) += vf_colormatrix.o +OBJS-$(CONFIG_COLORSPACE_FILTER) += vf_colorspace.o colorspacedsp.o OBJS-$(CONFIG_CONVOLUTION_FILTER) += vf_convolution.o OBJS-$(CONFIG_COPY_FILTER) += vf_copy.o OBJS-$(CONFIG_COREIMAGE_FILTER) += vf_coreimage.o diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c index b6f4a2c74f..5c31ff2e98 100644 --- a/libavfilter/allfilters.c +++ b/libavfilter/allfilters.c @@ -152,6 +152,7 @@ void avfilter_register_all(void) REGISTER_FILTER(COLORKEY, colorkey, vf); REGISTER_FILTER(COLORLEVELS, colorlevels, vf); REGISTER_FILTER(COLORMATRIX, colormatrix, vf); + REGISTER_FILTER(COLORSPACE, colorspace, vf); REGISTER_FILTER(CONVOLUTION, convolution, vf); REGISTER_FILTER(COPY, copy, vf); REGISTER_FILTER(COREIMAGE, coreimage, vf); diff --git a/libavfilter/colorspacedsp.c b/libavfilter/colorspacedsp.c new file mode 100644 index 0000000000..51a7c1ddb7 --- /dev/null +++ b/libavfilter/colorspacedsp.c @@ -0,0 +1,131 @@ +/* + * Copyright (c) 2016 Ronald S. Bultje + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include "colorspacedsp.h" + +#define SS_W 0 +#define SS_H 0 + +#define BIT_DEPTH 8 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 10 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 12 +#include "colorspacedsp_template.c" + +#undef SS_W +#undef SS_H + +#define SS_W 1 +#define SS_H 0 + +#undef BIT_DEPTH +#define BIT_DEPTH 8 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 10 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 12 +#include "colorspacedsp_template.c" + +#undef SS_W +#undef SS_H + +#define SS_W 1 +#define SS_H 1 + +#undef BIT_DEPTH +#define BIT_DEPTH 8 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 10 +#include "colorspacedsp_template.c" + +#undef BIT_DEPTH +#define BIT_DEPTH 12 +#include "colorspacedsp_template.c" + +static void multiply3x3_c(int16_t *buf[3], ptrdiff_t stride, + int w, int h, const int16_t m[3][3][8]) +{ + int y, x; + int16_t *buf0 = buf[0], *buf1 = buf[1], *buf2 = buf[2]; + + for (y = 0; y < h; y++) { + for (x = 0; x < w; x++) { + int v0 = buf0[x], v1 = buf1[x], v2 = buf2[x]; + + buf0[x] = av_clip_int16((m[0][0][0] * v0 + m[0][1][0] * v1 + + m[0][2][0] * v2 + 8192) >> 14); + buf1[x] = av_clip_int16((m[1][0][0] * v0 + m[1][1][0] * v1 + + m[1][2][0] * v2 + 8192) >> 14); + buf2[x] = av_clip_int16((m[2][0][0] * v0 + m[2][1][0] * v1 + + m[2][2][0] * v2 + 8192) >> 14); + } + + buf0 += stride; + buf1 += stride; + buf2 += stride; + } +} + +void ff_colorspacedsp_init(ColorSpaceDSPContext *dsp) +{ +#define init_yuv2rgb_fn(idx, bit) \ + dsp->yuv2rgb[idx][0] = yuv2rgb_444p##bit##_c; \ + dsp->yuv2rgb[idx][1] = yuv2rgb_422p##bit##_c; \ + dsp->yuv2rgb[idx][2] = yuv2rgb_420p##bit##_c + + init_yuv2rgb_fn(0, 8); + init_yuv2rgb_fn(1, 10); + init_yuv2rgb_fn(2, 12); + +#define init_rgb2yuv_fn(idx, bit) \ + dsp->rgb2yuv[idx][0] = rgb2yuv_444p##bit##_c; \ + dsp->rgb2yuv[idx][1] = rgb2yuv_422p##bit##_c; \ + dsp->rgb2yuv[idx][2] = rgb2yuv_420p##bit##_c + + init_rgb2yuv_fn(0, 8); + init_rgb2yuv_fn(1, 10); + init_rgb2yuv_fn(2, 12); + +#define init_yuv2yuv_fn(idx1, idx2, bit1, bit2) \ + dsp->yuv2yuv[idx1][idx2][0] = yuv2yuv_444p##bit1##to##bit2##_c; \ + dsp->yuv2yuv[idx1][idx2][1] = yuv2yuv_422p##bit1##to##bit2##_c; \ + dsp->yuv2yuv[idx1][idx2][2] = yuv2yuv_420p##bit1##to##bit2##_c +#define init_yuv2yuv_fns(idx1, bit1) \ + init_yuv2yuv_fn(idx1, 0, bit1, 8); \ + init_yuv2yuv_fn(idx1, 1, bit1, 10); \ + init_yuv2yuv_fn(idx1, 2, bit1, 12) + + init_yuv2yuv_fns(0, 8); + init_yuv2yuv_fns(1, 10); + init_yuv2yuv_fns(2, 12); + + dsp->multiply3x3 = multiply3x3_c; +} diff --git a/libavfilter/colorspacedsp.h b/libavfilter/colorspacedsp.h new file mode 100644 index 0000000000..357111752b --- /dev/null +++ b/libavfilter/colorspacedsp.h @@ -0,0 +1,51 @@ +/* + * Copyright (c) 2016 Ronald S. Bultje + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#ifndef AVFILTER_COLORSPACEDSP_H +#define AVFILTER_COLORSPACEDSP_H + +#include +#include + +typedef void (*yuv2rgb_fn)(int16_t *rgb[3], ptrdiff_t rgb_stride, + uint8_t *yuv[3], ptrdiff_t yuv_stride[3], + int w, int h, const int16_t yuv2rgb_coeffs[3][3][8], + const int16_t yuv_offset[8]); +typedef void (*rgb2yuv_fn)(uint8_t *yuv[3], ptrdiff_t yuv_stride[3], + int16_t *rgb[3], ptrdiff_t rgb_stride, + int w, int h, const int16_t rgb2yuv_coeffs[3][3][8], + const int16_t yuv_offset[8]); +typedef void (*yuv2yuv_fn)(uint8_t *yuv_out[3], ptrdiff_t yuv_out_stride[3], + uint8_t *yuv_in[3], ptrdiff_t yuv_in_stride[3], + int w, int h, const int16_t yuv2yuv_coeffs[3][3][8], + const int16_t yuv_offset[2][8]); + +typedef struct ColorSpaceDSPContext { + yuv2rgb_fn yuv2rgb[3 /* 0: 8bit, 1: 10bit, 2: 12bit */][3 /* 0: 444, 1: 422, 2: 420 */]; + rgb2yuv_fn rgb2yuv[3 /* 0: 8bit, 1: 10bit, 2: 12bit */][3 /* 0: 444, 1: 422, 2: 420 */]; + yuv2yuv_fn yuv2yuv[3 /* in_depth */][3 /* out_depth */][3 /* 0: 444, 1: 422, 2: 420 */]; + + void (*multiply3x3)(int16_t *data[3], ptrdiff_t stride, + int w, int h, const int16_t m[3][3][8]); +} ColorSpaceDSPContext; + +void ff_colorspacedsp_init(ColorSpaceDSPContext *dsp); + +#endif /* AVFILTER_COLORSPACEDSP_H */ diff --git a/libavfilter/colorspacedsp_template.c b/libavfilter/colorspacedsp_template.c new file mode 100644 index 0000000000..a32a0293f0 --- /dev/null +++ b/libavfilter/colorspacedsp_template.c @@ -0,0 +1,214 @@ +/* + * Copyright (c) 2016 Ronald S. Bultje + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include "libavutil/avassert.h" + +#undef avg +#undef ss + +#if SS_W == 0 +#define ss 444 +#define avg(a,b,c,d) (a) +#elif SS_H == 0 +#define ss 422 +#define avg(a,b,c,d) ((a + b + 1) >> 1) +#else +#define ss 420 +#define avg(a,b,c,d) ((a + b + c + d + 2) >> 2) +#endif + +#undef fn +#undef fn2 +#undef fn3 +#define fn3(a,b,c) a##_##c##p##b##_c +#define fn2(a,b,c) fn3(a,b,c) +#define fn(a) fn2(a, BIT_DEPTH, ss) + +#undef pixel +#undef av_clip_pixel +#if BIT_DEPTH == 8 +#define pixel uint8_t +#define av_clip_pixel(x) av_clip_uint8(x) +#else +#define pixel uint16_t +#define av_clip_pixel(x) av_clip_uintp2(x, BIT_DEPTH) +#endif + +static void fn(yuv2rgb)(int16_t *rgb[3], ptrdiff_t rgb_stride, + uint8_t *_yuv[3], ptrdiff_t yuv_stride[3], + int w, int h, const int16_t yuv2rgb_coeffs[3][3][8], + const int16_t yuv_offset[8]) +{ + pixel **yuv = (pixel **) _yuv; + const pixel *yuv0 = yuv[0], *yuv1 = yuv[1], *yuv2 = yuv[2]; + int16_t *rgb0 = rgb[0], *rgb1 = rgb[1], *rgb2 = rgb[2]; + int y, x; + int cy = yuv2rgb_coeffs[0][0][0]; + int crv = yuv2rgb_coeffs[0][2][0]; + int cgu = yuv2rgb_coeffs[1][1][0]; + int cgv = yuv2rgb_coeffs[1][2][0]; + int cbu = yuv2rgb_coeffs[2][1][0]; + const int sh = BIT_DEPTH - 1, rnd = 1 << (sh - 1); + const int uv_offset = 128 << (BIT_DEPTH - 8); + + av_assert2(yuv2rgb_coeffs[0][1][0] == 0); + av_assert2(yuv2rgb_coeffs[2][2][0] == 0); + av_assert2(yuv2rgb_coeffs[1][0][0] == cy && yuv2rgb_coeffs[2][0][0] == cy); + + w = AV_CEIL_RSHIFT(w, SS_W); + h = AV_CEIL_RSHIFT(h, SS_H); + for (y = 0; y < h; y++) { + for (x = 0; x < w; x++) { + int y00 = yuv0[x << SS_W] - yuv_offset[0]; +#if SS_W == 1 + int y01 = yuv0[2 * x + 1] - yuv_offset[0]; +#if SS_H == 1 + int y10 = yuv0[yuv_stride[0] / sizeof(pixel) + 2 * x] - yuv_offset[0]; + int y11 = yuv0[yuv_stride[0] / sizeof(pixel) + 2 * x + 1] - yuv_offset[0]; +#endif +#endif + int u = yuv1[x] - uv_offset, v = yuv2[x] - uv_offset; + + rgb0[x << SS_W] = av_clip_int16((y00 * cy + crv * v + rnd) >> sh); +#if SS_W == 1 + rgb0[2 * x + 1] = av_clip_int16((y01 * cy + crv * v + rnd) >> sh); +#if SS_H == 1 + rgb0[2 * x + rgb_stride] = av_clip_int16((y10 * cy + crv * v + rnd) >> sh); + rgb0[2 * x + rgb_stride + 1] = av_clip_int16((y11 * cy + crv * v + rnd) >> sh); +#endif +#endif + + rgb1[x << SS_W] = av_clip_int16((y00 * cy + cgu * u + + cgv * v + rnd) >> sh); +#if SS_W == 1 + rgb1[2 * x + 1] = av_clip_int16((y01 * cy + cgu * u + + cgv * v + rnd) >> sh); +#if SS_H == 1 + rgb1[2 * x + rgb_stride] = av_clip_int16((y10 * cy + cgu * u + + cgv * v + rnd) >> sh); + rgb1[2 * x + rgb_stride + 1] = av_clip_int16((y11 * cy + cgu * u + + cgv * v + rnd) >> sh); +#endif +#endif + + rgb2[x << SS_W] = av_clip_int16((y00 * cy + cbu * u + rnd) >> sh); +#if SS_W == 1 + rgb2[2 * x + 1] = av_clip_int16((y01 * cy + cbu * u + rnd) >> sh); +#if SS_H == 1 + rgb2[2 * x + rgb_stride] = av_clip_int16((y10 * cy + cbu * u + rnd) >> sh); + rgb2[2 * x + rgb_stride + 1] = av_clip_int16((y11 * cy + cbu * u + rnd) >> sh); +#endif +#endif + } + + yuv0 += (yuv_stride[0] * (1 << SS_H)) / sizeof(pixel); + yuv1 += yuv_stride[1] / sizeof(pixel); + yuv2 += yuv_stride[2] / sizeof(pixel); + rgb0 += rgb_stride * (1 << SS_H); + rgb1 += rgb_stride * (1 << SS_H); + rgb2 += rgb_stride * (1 << SS_H); + } +} + +static void fn(rgb2yuv)(uint8_t *_yuv[3], ptrdiff_t yuv_stride[3], + int16_t *rgb[3], ptrdiff_t s, + int w, int h, const int16_t rgb2yuv_coeffs[3][3][8], + const int16_t yuv_offset[8]) +{ + pixel **yuv = (pixel **) _yuv; + pixel *yuv0 = yuv[0], *yuv1 = yuv[1], *yuv2 = yuv[2]; + const int16_t *rgb0 = rgb[0], *rgb1 = rgb[1], *rgb2 = rgb[2]; + int y, x; + const int sh = 29 - BIT_DEPTH; + const int rnd = 1 << (sh - 1); + int cry = rgb2yuv_coeffs[0][0][0]; + int cgy = rgb2yuv_coeffs[0][1][0]; + int cby = rgb2yuv_coeffs[0][2][0]; + int cru = rgb2yuv_coeffs[1][0][0]; + int cgu = rgb2yuv_coeffs[1][1][0]; + int cburv = rgb2yuv_coeffs[1][2][0]; + int cgv = rgb2yuv_coeffs[2][1][0]; + int cbv = rgb2yuv_coeffs[2][2][0]; + ptrdiff_t s0 = yuv_stride[0] / sizeof(pixel); + const int uv_offset = 128 << (BIT_DEPTH - 8); + + av_assert2(rgb2yuv_coeffs[1][2][0] == rgb2yuv_coeffs[2][0][0]); + w = AV_CEIL_RSHIFT(w, SS_W); + h = AV_CEIL_RSHIFT(h, SS_H); + for (y = 0; y < h; y++) { + for (x = 0; x < w; x++) { + int r00 = rgb0[x << SS_W], g00 = rgb1[x << SS_W], b00 = rgb2[x << SS_W]; +#if SS_W == 1 + int r01 = rgb0[x * 2 + 1], g01 = rgb1[x * 2 + 1], b01 = rgb2[x * 2 + 1]; +#if SS_H == 1 + int r10 = rgb0[x * 2 + 0 + s], g10 = rgb1[x * 2 + 0 + s], b10 = rgb2[x * 2 + 0 + s]; + int r11 = rgb0[x * 2 + 1 + s], g11 = rgb1[x * 2 + 1 + s], b11 = rgb2[x * 2 + 1 + s]; +#endif +#endif + + yuv0[x << SS_W] = av_clip_pixel(yuv_offset[0] + + ((r00 * cry + g00 * cgy + + b00 * cby + rnd) >> sh)); +#if SS_W == 1 + yuv0[x * 2 + 1] = av_clip_pixel(yuv_offset[0] + + ((r01 * cry + g01 * cgy + + b01 * cby + rnd) >> sh)); +#if SS_H == 1 + yuv0[x * 2 + 0 + s0] = av_clip_pixel(yuv_offset[0] + + ((r10 * cry + g10 * cgy + + b10 * cby + rnd) >> sh)); + yuv0[x * 2 + 1 + s0] = av_clip_pixel(yuv_offset[0] + + ((r11 * cry + g11 * cgy + + b11 * cby + rnd) >> sh)); +#endif +#endif + + yuv1[x] = av_clip_pixel(uv_offset + + ((avg(r00, r01, r10, r11) * cru + + avg(g00, g01, g10, g11) * cgu + + avg(b00, b01, b10, b11) * cburv + rnd) >> sh)); + yuv2[x] = av_clip_pixel(uv_offset + + ((avg(r00, r01, r10, r11) * cburv + + avg(g00, g01, g10, g11) * cgv + + avg(b00, b01, b10, b11) * cbv + rnd) >> sh)); + } + + yuv0 += s0 * (1 << SS_H); + yuv1 += yuv_stride[1] / sizeof(pixel); + yuv2 += yuv_stride[2] / sizeof(pixel); + rgb0 += s * (1 << SS_H); + rgb1 += s * (1 << SS_H); + rgb2 += s * (1 << SS_H); + } +} + +#undef IN_BIT_DEPTH +#undef OUT_BIT_DEPTH +#define OUT_BIT_DEPTH BIT_DEPTH +#define IN_BIT_DEPTH 8 +#include "colorspacedsp_yuv2yuv_template.c" + +#undef IN_BIT_DEPTH +#define IN_BIT_DEPTH 10 +#include "colorspacedsp_yuv2yuv_template.c" + +#undef IN_BIT_DEPTH +#define IN_BIT_DEPTH 12 +#include "colorspacedsp_yuv2yuv_template.c" diff --git a/libavfilter/colorspacedsp_yuv2yuv_template.c b/libavfilter/colorspacedsp_yuv2yuv_template.c new file mode 100644 index 0000000000..8b0d33a788 --- /dev/null +++ b/libavfilter/colorspacedsp_yuv2yuv_template.c @@ -0,0 +1,98 @@ +/* + * Copyright (c) 2016 Ronald S. Bultje + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include "libavutil/avassert.h" + +#undef opixel +#define opixel pixel + +#undef ipixel +#if IN_BIT_DEPTH == 8 +#define ipixel uint8_t +#else +#define ipixel uint16_t +#endif + +#undef fn +#undef fn2 +#undef fn3 +#define fn3(a,b,c,d) a##_##d##p##b##to##c##_c +#define fn2(a,b,c,d) fn3(a,b,c,d) +#define fn(a) fn2(a, IN_BIT_DEPTH, OUT_BIT_DEPTH, ss) + +static void fn(yuv2yuv)(uint8_t *_dst[3], ptrdiff_t dst_stride[3], + uint8_t *_src[3], ptrdiff_t src_stride[3], + int w, int h, const int16_t c[3][3][8], + const int16_t yuv_offset[2][8]) +{ + opixel **dst = (opixel **) _dst; + ipixel **src = (ipixel **) _src; + const ipixel *src0 = src[0], *src1 = src[1], *src2 = src[2]; + opixel *dst0 = dst[0], *dst1 = dst[1], *dst2 = dst[2]; + int y, x; + const int sh = 14 + IN_BIT_DEPTH - OUT_BIT_DEPTH; + const int rnd = 1 << (sh - 1); + int y_off_in = yuv_offset[0][0]; + int y_off_out = yuv_offset[1][0] << sh; + const int uv_off_in = 128 << (IN_BIT_DEPTH - 8); + const int uv_off_out = rnd + (128 << (OUT_BIT_DEPTH - 8 + sh)); + int cyy = c[0][0][0], cyu = c[0][1][0], cyv = c[0][2][0]; + int cuu = c[1][1][0], cuv = c[1][2][0], cvu = c[2][1][0], cvv = c[2][2][0]; + + av_assert2(c[1][0][0] == 0); + av_assert2(c[2][0][0] == 0); + w = AV_CEIL_RSHIFT(w, SS_W); + h = AV_CEIL_RSHIFT(h, SS_H); + for (y = 0; y < h; y++) { + for (x = 0; x < w; x++) { + int y00 = src0[x << SS_W] - y_off_in; +#if SS_W == 1 + int y01 = src0[2 * x + 1] - y_off_in; +#if SS_H == 1 + int y10 = src0[src_stride[0] / sizeof(ipixel) + 2 * x] - y_off_in; + int y11 = src0[src_stride[0] / sizeof(ipixel) + 2 * x + 1] - y_off_in; +#endif +#endif + int u = src1[x] - uv_off_in, v = src2[x] - uv_off_in; + int uv_val = cyu * u + cyv * v + rnd + y_off_out; + + dst0[x << SS_W] = av_clip_pixel((cyy * y00 + uv_val) >> sh); +#if SS_W == 1 + dst0[x * 2 + 1] = av_clip_pixel((cyy * y01 + uv_val) >> sh); +#if SS_H == 1 + dst0[x * 2 + 0 + dst_stride[0] / sizeof(opixel)] = + av_clip_pixel((cyy * y10 + uv_val) >> sh); + dst0[x * 2 + 1 + dst_stride[0] / sizeof(opixel)] = + av_clip_pixel((cyy * y11 + uv_val) >> sh); +#endif +#endif + + dst1[x] = av_clip_pixel((u * cuu + v * cuv + uv_off_out) >> sh); + dst2[x] = av_clip_pixel((u * cvu + v * cvv + uv_off_out) >> sh); + } + + dst0 += (dst_stride[0] * (1 << SS_H)) / sizeof(opixel); + dst1 += dst_stride[1] / sizeof(opixel); + dst2 += dst_stride[2] / sizeof(opixel); + src0 += (src_stride[0] * (1 << SS_H)) / sizeof(ipixel); + src1 += src_stride[1] / sizeof(ipixel); + src2 += src_stride[2] / sizeof(ipixel); + } +} diff --git a/libavfilter/vf_colorspace.c b/libavfilter/vf_colorspace.c new file mode 100644 index 0000000000..bc26d8f1b7 --- /dev/null +++ b/libavfilter/vf_colorspace.c @@ -0,0 +1,1024 @@ +/* + * Copyright (c) 2016 Ronald S. Bultje + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +/* + * @file + * Convert between colorspaces. + */ + +#include "libavutil/avassert.h" +#include "libavutil/opt.h" +#include "libavutil/pixdesc.h" +#include "libavutil/pixfmt.h" + +#include "avfilter.h" +#include "colorspacedsp.h" +#include "formats.h" +#include "internal.h" +#include "video.h" + +enum Colorspace { + CS_UNSPECIFIED, + CS_BT470M, + CS_BT470BG, + CS_BT601_6_525, + CS_BT601_6_625, + CS_BT709, + CS_SMPTE170M, + CS_SMPTE240M, + CS_BT2020, + CS_NB, +}; + +enum Whitepoint { + WP_D65, + WP_C, + WP_NB, +}; + +static const enum AVColorTransferCharacteristic default_trc[CS_NB + 1] = { + [CS_UNSPECIFIED] = AVCOL_TRC_UNSPECIFIED, + [CS_BT470M] = AVCOL_TRC_GAMMA22, + [CS_BT470BG] = AVCOL_TRC_GAMMA28, + [CS_BT601_6_525] = AVCOL_TRC_SMPTE170M, + [CS_BT601_6_625] = AVCOL_TRC_SMPTE170M, + [CS_BT709] = AVCOL_TRC_BT709, + [CS_SMPTE170M] = AVCOL_TRC_SMPTE170M, + [CS_SMPTE240M] = AVCOL_TRC_SMPTE240M, + [CS_BT2020] = AVCOL_TRC_BT2020_10, + [CS_NB] = AVCOL_TRC_UNSPECIFIED, +}; + +static const enum AVColorPrimaries default_prm[CS_NB + 1] = { + [CS_UNSPECIFIED] = AVCOL_PRI_UNSPECIFIED, + [CS_BT470M] = AVCOL_PRI_BT470M, + [CS_BT470BG] = AVCOL_PRI_BT470BG, + [CS_BT601_6_525] = AVCOL_PRI_SMPTE170M, + [CS_BT601_6_625] = AVCOL_PRI_BT470BG, + [CS_BT709] = AVCOL_PRI_BT709, + [CS_SMPTE170M] = AVCOL_PRI_SMPTE170M, + [CS_SMPTE240M] = AVCOL_PRI_SMPTE240M, + [CS_BT2020] = AVCOL_PRI_BT2020, + [CS_NB] = AVCOL_PRI_UNSPECIFIED, +}; + +static const enum AVColorSpace default_csp[CS_NB + 1] = { + [CS_UNSPECIFIED] = AVCOL_SPC_UNSPECIFIED, + [CS_BT470M] = AVCOL_SPC_SMPTE170M, + [CS_BT470BG] = AVCOL_SPC_BT470BG, + [CS_BT601_6_525] = AVCOL_SPC_SMPTE170M, + [CS_BT601_6_625] = AVCOL_SPC_BT470BG, + [CS_BT709] = AVCOL_SPC_BT709, + [CS_SMPTE170M] = AVCOL_SPC_SMPTE170M, + [CS_SMPTE240M] = AVCOL_SPC_SMPTE240M, + [CS_BT2020] = AVCOL_SPC_BT2020_NCL, + [CS_NB] = AVCOL_SPC_UNSPECIFIED, +}; + +struct ColorPrimaries { + enum Whitepoint wp; + double xr, yr, xg, yg, xb, yb; +}; + +struct TransferCharacteristics { + double alpha, beta, gamma, delta; +}; + +struct LumaCoefficients { + double cr, cg, cb; +}; + +struct WhitepointCoefficients { + double xw, yw; +}; + +typedef struct ColorSpaceContext { + const AVClass *class; + + ColorSpaceDSPContext dsp; + + enum Colorspace user_all; + enum AVColorSpace in_csp, out_csp, user_csp; + enum AVColorRange in_rng, out_rng, user_rng; + enum AVColorTransferCharacteristic in_trc, out_trc, user_trc; + enum AVColorPrimaries in_prm, out_prm, user_prm; + enum AVPixelFormat in_format, user_format; + int fast_mode; + + int16_t *rgb[3]; + ptrdiff_t rgb_stride; + unsigned rgb_sz; + + const struct ColorPrimaries *in_primaries, *out_primaries; + int lrgb2lrgb_passthrough; + DECLARE_ALIGNED(16, int16_t, lrgb2lrgb_coeffs)[3][3][8]; + + const struct TransferCharacteristics *in_txchr, *out_txchr; + int rgb2rgb_passthrough; + int16_t *lin_lut, *delin_lut; + + const struct LumaCoefficients *in_lumacoef, *out_lumacoef; + int yuv2yuv_passthrough, yuv2yuv_fastmode; + DECLARE_ALIGNED(16, int16_t, yuv2rgb_coeffs)[3][3][8]; + DECLARE_ALIGNED(16, int16_t, rgb2yuv_coeffs)[3][3][8]; + DECLARE_ALIGNED(16, int16_t, yuv2yuv_coeffs)[3][3][8]; + DECLARE_ALIGNED(16, int16_t, yuv_offset)[2 /* in, out */][8]; + yuv2rgb_fn yuv2rgb; + rgb2yuv_fn rgb2yuv; + yuv2yuv_fn yuv2yuv; + double yuv2rgb_dbl_coeffs[3][3], rgb2yuv_dbl_coeffs[3][3]; + int in_y_rng, in_uv_rng, out_y_rng, out_uv_rng; +} ColorSpaceContext; + +// FIXME deal with odd width/heights (or just forbid it) +// FIXME faster linearize/delinearize implementation (integer pow) +// FIXME bt2020cl support (linearization between yuv/rgb step instead of between rgb/xyz) +// FIXME test that the values in (de)lin_lut don't exceed their container storage +// type size (only useful if we keep the LUT and don't move to fast integer pow) +// FIXME dithering if bitdepth goes down? +// FIXME bitexact for fate integration? + +/* + * All constants explained in e.g. https://linuxtv.org/downloads/v4l-dvb-apis/ch02s06.html + * The older ones (bt470bg/m) are also explained in their respective ITU docs + * (e.g. https://www.itu.int/dms_pubrec/itu-r/rec/bt/R-REC-BT.470-5-199802-S!!PDF-E.pdf) + * whereas the newer ones can typically be copied directly from wikipedia :) + */ +static const struct LumaCoefficients luma_coefficients[AVCOL_SPC_NB] = { + [AVCOL_SPC_FCC] = { 0.30, 0.59, 0.11 }, + [AVCOL_SPC_BT470BG] = { 0.299, 0.587, 0.114 }, + [AVCOL_SPC_SMPTE170M] = { 0.299, 0.587, 0.114 }, + [AVCOL_SPC_BT709] = { 0.2126, 0.7152, 0.0722 }, + [AVCOL_SPC_SMPTE240M] = { 0.212, 0.701, 0.087 }, + [AVCOL_SPC_BT2020_NCL] = { 0.2627, 0.6780, 0.0593 }, + [AVCOL_SPC_BT2020_CL] = { 0.2627, 0.6780, 0.0593 }, +}; + +static const struct LumaCoefficients *get_luma_coefficients(enum AVColorSpace csp) +{ + const struct LumaCoefficients *coeffs; + + if (csp >= AVCOL_SPC_NB) + return NULL; + coeffs = &luma_coefficients[csp]; + if (!coeffs->cr) + return NULL; + + return coeffs; +} + +static void fill_rgb2yuv_table(const struct LumaCoefficients *coeffs, + double rgb2yuv[3][3]) +{ + double bscale, rscale; + + rgb2yuv[0][0] = coeffs->cr; + rgb2yuv[0][1] = coeffs->cg; + rgb2yuv[0][2] = coeffs->cb; + bscale = 0.5 / (coeffs->cb - 1.0); + rscale = 0.5 / (coeffs->cr - 1.0); + rgb2yuv[1][0] = bscale * coeffs->cr; + rgb2yuv[1][1] = bscale * coeffs->cg; + rgb2yuv[1][2] = 0.5; + rgb2yuv[2][0] = 0.5; + rgb2yuv[2][1] = rscale * coeffs->cg; + rgb2yuv[2][2] = rscale * coeffs->cb; +} + +// FIXME I'm pretty sure gamma22/28 also have a linear toe slope, but I can't +// find any actual tables that document their real values... +// See http://www.13thmonkey.org/~boris/gammacorrection/ first graph why it matters +static const struct TransferCharacteristics transfer_characteristics[AVCOL_TRC_NB] = { + [AVCOL_TRC_BT709] = { 1.099, 0.018, 0.45, 4.5 }, + [AVCOL_TRC_GAMMA22] = { 1.0, 0.0, 1.0 / 2.2, 0.0 }, + [AVCOL_TRC_GAMMA28] = { 1.0, 0.0, 1.0 / 2.8, 0.0 }, + [AVCOL_TRC_SMPTE170M] = { 1.099, 0.018, 0.45, 4.5 }, + [AVCOL_TRC_SMPTE240M] = { 1.1115, 0.0228, 0.45, 4.0 }, + [AVCOL_TRC_BT2020_10] = { 1.099, 0.018, 0.45, 4.5 }, + [AVCOL_TRC_BT2020_12] = { 1.0993, 0.0181, 0.45, 4.5 }, +}; + +static const struct TransferCharacteristics * + get_transfer_characteristics(enum AVColorTransferCharacteristic trc) +{ + const struct TransferCharacteristics *coeffs; + + if (trc >= AVCOL_TRC_NB) + return NULL; + coeffs = &transfer_characteristics[trc]; + if (!coeffs->alpha) + return NULL; + + return coeffs; +} + +static const struct WhitepointCoefficients whitepoint_coefficients[WP_NB] = { + [WP_D65] = { 0.3127, 0.3290 }, + [WP_C] = { 0.3100, 0.3160 }, +}; + +static const struct ColorPrimaries color_primaries[AVCOL_PRI_NB] = { + [AVCOL_PRI_BT709] = { WP_D65, 0.640, 0.330, 0.300, 0.600, 0.150, 0.060 }, + [AVCOL_PRI_BT470M] = { WP_C, 0.670, 0.330, 0.210, 0.710, 0.140, 0.080 }, + [AVCOL_PRI_BT470BG] = { WP_D65, 0.640, 0.330, 0.290, 0.600, 0.150, 0.060,}, + [AVCOL_PRI_SMPTE170M] = { WP_D65, 0.630, 0.340, 0.310, 0.595, 0.155, 0.070 }, + [AVCOL_PRI_SMPTE240M] = { WP_D65, 0.630, 0.340, 0.310, 0.595, 0.155, 0.070 }, + [AVCOL_PRI_BT2020] = { WP_D65, 0.708, 0.292, 0.170, 0.797, 0.131, 0.046 }, +}; + +static const struct ColorPrimaries *get_color_primaries(enum AVColorPrimaries prm) +{ + const struct ColorPrimaries *coeffs; + + if (prm >= AVCOL_PRI_NB) + return NULL; + coeffs = &color_primaries[prm]; + if (!coeffs->xr) + return NULL; + + return coeffs; +} + +static void invert_matrix3x3(const double in[3][3], double out[3][3]) +{ + double m00 = in[0][0], m01 = in[0][1], m02 = in[0][2], + m10 = in[1][0], m11 = in[1][1], m12 = in[1][2], + m20 = in[2][0], m21 = in[2][1], m22 = in[2][2]; + int i, j; + double det; + + out[0][0] = (m11 * m22 - m21 * m12); + out[0][1] = -(m01 * m22 - m21 * m02); + out[0][2] = (m01 * m12 - m11 * m02); + out[1][0] = -(m10 * m22 - m20 * m12); + out[1][1] = (m00 * m22 - m20 * m02); + out[1][2] = -(m00 * m12 - m10 * m02); + out[2][0] = (m10 * m21 - m20 * m11); + out[2][1] = -(m00 * m21 - m20 * m01); + out[2][2] = (m00 * m11 - m10 * m01); + + det = m00 * out[0][0] + m10 * out[0][1] + m20 * out[0][2]; + det = 1.0 / det; + + for (i = 0; i < 3; i++) { + for (j = 0; j < 3; j++) + out[i][j] *= det; + } +} + +static int fill_gamma_table(ColorSpaceContext *s) +{ + int n; + double in_alpha = s->in_txchr->alpha, in_beta = s->in_txchr->beta; + double in_gamma = s->in_txchr->gamma, in_delta = s->in_txchr->delta; + double in_ialpha = 1.0 / in_alpha, in_igamma = 1.0 / in_gamma, in_idelta = 1.0 / in_delta; + double out_alpha = s->out_txchr->alpha, out_beta = s->out_txchr->beta; + double out_gamma = s->out_txchr->gamma, out_delta = s->out_txchr->delta; + + s->lin_lut = av_malloc(sizeof(*s->lin_lut) * 32768 * 2); + if (!s->lin_lut) + return AVERROR(ENOMEM); + s->delin_lut = &s->lin_lut[32768]; + for (n = 0; n < 32768; n++) { + double v = (n - 2048.0) / 28672.0, d, l; + + // delinearize + if (v <= -out_beta) { + d = -out_alpha * pow(-v, out_gamma) + (out_alpha - 1.0); + } else if (v < out_beta) { + d = out_delta * v; + } else { + d = out_alpha * pow(v, out_gamma) - (out_alpha - 1.0); + } + s->delin_lut[n] = av_clip_int16(lrint(d * 28672.0)); + + // linearize + if (v <= -in_beta) { + l = -pow((1.0 - in_alpha - v) * in_ialpha, in_igamma); + } else if (v < in_beta) { + l = v * in_idelta; + } else { + l = pow((v + in_alpha - 1.0) * in_ialpha, in_igamma); + } + s->lin_lut[n] = av_clip_int16(lrint(l * 28672.0)); + } + + return 0; +} + +/* + * see e.g. http://www.brucelindbloom.com/index.html?Eqn_RGB_XYZ_Matrix.html + */ +static void fill_rgb2xyz_table(const struct ColorPrimaries *coeffs, + double rgb2xyz[3][3]) +{ + const struct WhitepointCoefficients *wp = &whitepoint_coefficients[coeffs->wp]; + double i[3][3], sr, sg, sb, zw; + + rgb2xyz[0][0] = coeffs->xr / coeffs->yr; + rgb2xyz[0][1] = coeffs->xg / coeffs->yg; + rgb2xyz[0][2] = coeffs->xb / coeffs->yb; + rgb2xyz[1][0] = rgb2xyz[1][1] = rgb2xyz[1][2] = 1.0; + rgb2xyz[2][0] = (1.0 - coeffs->xr - coeffs->yr) / coeffs->yr; + rgb2xyz[2][1] = (1.0 - coeffs->xg - coeffs->yg) / coeffs->yg; + rgb2xyz[2][2] = (1.0 - coeffs->xb - coeffs->yb) / coeffs->yb; + invert_matrix3x3(rgb2xyz, i); + zw = 1.0 - wp->xw - wp->yw; + sr = i[0][0] * wp->xw + i[0][1] * wp->yw + i[0][2] * zw; + sg = i[1][0] * wp->xw + i[1][1] * wp->yw + i[1][2] * zw; + sb = i[2][0] * wp->xw + i[2][1] * wp->yw + i[2][2] * zw; + rgb2xyz[0][0] *= sr; + rgb2xyz[0][1] *= sg; + rgb2xyz[0][2] *= sb; + rgb2xyz[1][0] *= sr; + rgb2xyz[1][1] *= sg; + rgb2xyz[1][2] *= sb; + rgb2xyz[2][0] *= sr; + rgb2xyz[2][1] *= sg; + rgb2xyz[2][2] *= sb; +} + +static void mul3x3(double dst[3][3], const double src1[3][3], const double src2[3][3]) +{ + int m, n; + + for (m = 0; m < 3; m++) + for (n = 0; n < 3; n++) + dst[m][n] = src2[m][0] * src1[0][n] + + src2[m][1] * src1[1][n] + + src2[m][2] * src1[2][n]; +} + +/* + * See http://www.brucelindbloom.com/index.html?Eqn_ChromAdapt.html + * This function uses the Bradford mechanism. + */ +static void fill_whitepoint_conv_table(double out[3][3], + enum Whitepoint src, enum Whitepoint dst) +{ + static const double ma[3][3] = { + { 0.8951, 0.2664, -0.1614 }, + { -0.7502, 1.7135, 0.0367 }, + { 0.0389, -0.0685, 1.0296 }, + }; + const struct WhitepointCoefficients *wp_src = &whitepoint_coefficients[src]; + double zw_src = 1.0 - wp_src->xw - wp_src->yw; + const struct WhitepointCoefficients *wp_dst = &whitepoint_coefficients[dst]; + double zw_dst = 1.0 - wp_dst->xw - wp_dst->yw; + double mai[3][3], fac[3][3], tmp[3][3]; + double rs, gs, bs, rd, gd, bd; + + invert_matrix3x3(ma, mai); + rs = ma[0][0] * wp_src->xw + ma[0][1] * wp_src->yw + ma[0][2] * zw_src; + gs = ma[1][0] * wp_src->xw + ma[1][1] * wp_src->yw + ma[1][2] * zw_src; + bs = ma[2][0] * wp_src->xw + ma[2][1] * wp_src->yw + ma[2][2] * zw_src; + rd = ma[0][0] * wp_dst->xw + ma[0][1] * wp_dst->yw + ma[0][2] * zw_dst; + gd = ma[1][0] * wp_dst->xw + ma[1][1] * wp_dst->yw + ma[1][2] * zw_dst; + bd = ma[2][0] * wp_dst->xw + ma[2][1] * wp_dst->yw + ma[2][2] * zw_dst; + fac[0][0] = rd / rs; + fac[1][1] = gd / gs; + fac[2][2] = bd / bs; + fac[0][1] = fac[0][2] = fac[1][0] = fac[1][2] = fac[2][0] = fac[2][1] = 0.0; + mul3x3(tmp, ma, fac); + mul3x3(out, tmp, mai); +} + +static void apply_lut(int16_t *buf[3], ptrdiff_t stride, + int w, int h, const int16_t *lut) +{ + int y, x, n; + + for (n = 0; n < 3; n++) { + int16_t *data = buf[n]; + + for (y = 0; y < h; y++) { + for (x = 0; x < w; x++) + data[x] = lut[av_clip_uintp2(2048 + data[x], 15)]; + + data += stride; + } + } +} + +struct ThreadData { + AVFrame *in, *out; + ptrdiff_t in_linesize[3], out_linesize[3]; + int in_ss_h, out_ss_h; +}; + +static int convert(AVFilterContext *ctx, void *data, int job_nr, int n_jobs) +{ + struct ThreadData *td = data; + ColorSpaceContext *s = ctx->priv; + uint8_t *in_data[3], *out_data[3]; + int16_t *rgb[3]; + int h_in = (td->in->height + 1) >> 1; + int h1 = 2 * (job_nr * h_in / n_jobs), h2 = 2 * ((job_nr + 1) * h_in / n_jobs); + int w = td->in->width, h = h2 - h1; + + in_data[0] = td->in->data[0] + td->in_linesize[0] * h1; + in_data[1] = td->in->data[1] + td->in_linesize[1] * (h1 >> td->in_ss_h); + in_data[2] = td->in->data[2] + td->in_linesize[2] * (h1 >> td->in_ss_h); + out_data[0] = td->out->data[0] + td->out_linesize[0] * h1; + out_data[1] = td->out->data[1] + td->out_linesize[1] * (h1 >> td->out_ss_h); + out_data[2] = td->out->data[2] + td->out_linesize[2] * (h1 >> td->out_ss_h); + rgb[0] = s->rgb[0] + s->rgb_stride * h1; + rgb[1] = s->rgb[1] + s->rgb_stride * h1; + rgb[2] = s->rgb[2] + s->rgb_stride * h1; + + // FIXME for simd, also make sure we do pictures with negative stride + // top-down so we don't overwrite lines with padding of data before it + // in the same buffer (same as swscale) + + if (s->yuv2yuv_fastmode) { + // FIXME possibly use a fast mode in case only the y range changes? + // since in that case, only the diagonal entries in yuv2yuv_coeffs[] + // are non-zero + s->yuv2yuv(out_data, td->out_linesize, in_data, td->in_linesize, w, h, + s->yuv2yuv_coeffs, s->yuv_offset); + } else { + // FIXME maybe (for caching effciency) do pipeline per-line instead of + // full buffer per function? (Or, since yuv2rgb requires 2 lines: per + // 2 lines, for yuv420.) + /* + * General design: + * - yuv2rgb converts from whatever range the input was ([16-235/240] or + * [0,255] or the 10/12bpp equivalents thereof) to an integer version + * of RGB in psuedo-restricted 15+sign bits. That means that the float + * range [0.0,1.0] is in [0,28762], and the remainder of the int16_t + * range is used for overflow/underflow outside the representable + * range of this RGB type. rgb2yuv is the exact opposite. + * - gamma correction is done using a LUT since that appears to work + * fairly fast. + * - If the input is chroma-subsampled (420/422), the yuv2rgb conversion + * (or rgb2yuv conversion) uses nearest-neighbour sampling to read + * read chroma pixels at luma resolution. If you want some more fancy + * filter, you can use swscale to convert to yuv444p. + * - all coefficients are 14bit (so in the [-2.0,2.0] range). + */ + s->yuv2rgb(rgb, s->rgb_stride, in_data, td->in_linesize, w, h, + s->yuv2rgb_coeffs, s->yuv_offset[0]); + if (!s->rgb2rgb_passthrough) { + apply_lut(rgb, s->rgb_stride, w, h, s->lin_lut); + if (!s->lrgb2lrgb_passthrough) + s->dsp.multiply3x3(rgb, s->rgb_stride, w, h, s->lrgb2lrgb_coeffs); + apply_lut(rgb, s->rgb_stride, w, h, s->delin_lut); + } + s->rgb2yuv(out_data, td->out_linesize, rgb, s->rgb_stride, w, h, + s->rgb2yuv_coeffs, s->yuv_offset[1]); + } + + return 0; +} + +static int get_range_off(int *off, int *y_rng, int *uv_rng, + enum AVColorRange rng, int depth) +{ + switch (rng) { + case AVCOL_RANGE_MPEG: + *off = 16 << (depth - 8); + *y_rng = 219 << (depth - 8); + *uv_rng = 224 << (depth - 8); + break; + case AVCOL_RANGE_JPEG: + *off = 0; + *y_rng = *uv_rng = (256 << (depth - 8)) - 1; + break; + default: + return AVERROR(EINVAL); + } + + return 0; +} + +static int create_filtergraph(AVFilterContext *ctx, + const AVFrame *in, const AVFrame *out) +{ + ColorSpaceContext *s = ctx->priv; + const AVPixFmtDescriptor *in_desc = av_pix_fmt_desc_get(in->format); + const AVPixFmtDescriptor *out_desc = av_pix_fmt_desc_get(out->format); + int emms = 0, m, n, o, res, fmt_identical, redo_yuv2rgb = 0, redo_rgb2yuv = 0; + +#define supported_depth(d) ((d) == 8 || (d) == 10 || (d) == 12) +#define supported_subsampling(lcw, lch) \ + (((lcw) == 0 && (lch) == 0) || ((lcw) == 1 && (lch) == 0) || ((lcw) == 1 && (lch) == 1)) +#define supported_format(d) \ + ((d) != NULL && (d)->nb_components == 3 && \ + !((d)->flags & AV_PIX_FMT_FLAG_RGB) && \ + supported_depth((d)->comp[0].depth) && \ + supported_subsampling((d)->log2_chroma_w, (d)->log2_chroma_h)) + + if (!supported_format(in_desc)) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported input format %d (%s) or bitdepth (%d)\n", + in->format, av_get_pix_fmt_name(in->format), + in_desc ? in_desc->comp[0].depth : -1); + return AVERROR(EINVAL); + } + if (!supported_format(out_desc)) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output format %d (%s) or bitdepth (%d)\n", + out->format, av_get_pix_fmt_name(out->format), + out_desc ? out_desc->comp[0].depth : -1); + return AVERROR(EINVAL); + } + + if (in->color_primaries != s->in_prm) s->in_primaries = NULL; + if (out->color_primaries != s->out_prm) s->out_primaries = NULL; + if (in->color_trc != s->in_trc) s->in_txchr = NULL; + if (out->color_trc != s->out_trc) s->out_txchr = NULL; + if (in->colorspace != s->in_csp || + in->color_range != s->in_rng) s->in_lumacoef = NULL; + if (out->colorspace != s->out_csp || + out->color_range != s->out_rng) s->out_lumacoef = NULL; + + if (!s->out_primaries || !s->in_primaries) { + s->in_prm = in->color_primaries; + s->in_primaries = get_color_primaries(s->in_prm); + if (!s->in_primaries) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported input primaries %d (%s)\n", + s->in_prm, av_color_primaries_name(s->in_prm)); + return AVERROR(EINVAL); + } + s->out_prm = out->color_primaries; + s->out_primaries = get_color_primaries(s->out_prm); + if (!s->out_primaries) { + if (s->out_prm == AVCOL_PRI_UNSPECIFIED) { + if (s->user_all == CS_UNSPECIFIED) { + av_log(ctx, AV_LOG_ERROR, "Please specify output primaries\n"); + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output color property %d\n", s->user_all); + } + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output primaries %d (%s)\n", + s->out_prm, av_color_primaries_name(s->out_prm)); + } + return AVERROR(EINVAL); + } + s->lrgb2lrgb_passthrough = !memcmp(s->in_primaries, s->out_primaries, + sizeof(*s->in_primaries)); + if (!s->lrgb2lrgb_passthrough) { + double rgb2xyz[3][3], xyz2rgb[3][3], rgb2rgb[3][3]; + + fill_rgb2xyz_table(s->out_primaries, rgb2xyz); + invert_matrix3x3(rgb2xyz, xyz2rgb); + fill_rgb2xyz_table(s->in_primaries, rgb2xyz); + if (s->out_primaries->wp != s->in_primaries->wp) { + double wpconv[3][3], tmp[3][3]; + + fill_whitepoint_conv_table(wpconv, s->in_primaries->wp, + s->out_primaries->wp); + mul3x3(tmp, rgb2xyz, wpconv); + mul3x3(rgb2rgb, tmp, xyz2rgb); + } else { + mul3x3(rgb2rgb, rgb2xyz, xyz2rgb); + } + for (m = 0; m < 3; m++) + for (n = 0; n < 3; n++) { + s->lrgb2lrgb_coeffs[m][n][0] = lrint(16384.0 * rgb2rgb[m][n]); + for (o = 1; o < 8; o++) + s->lrgb2lrgb_coeffs[m][n][o] = s->lrgb2lrgb_coeffs[m][n][0]; + } + + emms = 1; + } + } + + if (!s->in_txchr) { + av_freep(&s->lin_lut); + s->in_trc = in->color_trc; + s->in_txchr = get_transfer_characteristics(s->in_trc); + if (!s->in_txchr) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported input transfer characteristics %d (%s)\n", + s->in_trc, av_color_transfer_name(s->in_trc)); + return AVERROR(EINVAL); + } + } + + if (!s->out_txchr) { + av_freep(&s->lin_lut); + s->out_trc = out->color_trc; + s->out_txchr = get_transfer_characteristics(s->out_trc); + if (!s->out_txchr) { + if (s->out_trc == AVCOL_TRC_UNSPECIFIED) { + if (s->user_all == CS_UNSPECIFIED) { + av_log(ctx, AV_LOG_ERROR, + "Please specify output transfer characteristics\n"); + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output color property %d\n", s->user_all); + } + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output transfer characteristics %d (%s)\n", + s->out_trc, av_color_transfer_name(s->out_trc)); + } + return AVERROR(EINVAL); + } + } + + s->rgb2rgb_passthrough = s->fast_mode || (s->lrgb2lrgb_passthrough && + !memcmp(s->in_txchr, s->out_txchr, sizeof(*s->in_txchr))); + if (!s->rgb2rgb_passthrough && !s->lin_lut) { + res = fill_gamma_table(s); + if (res < 0) + return res; + emms = 1; + } + + if (!s->in_lumacoef) { + s->in_csp = in->colorspace; + s->in_rng = in->color_range; + s->in_lumacoef = get_luma_coefficients(s->in_csp); + if (!s->in_lumacoef) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported input colorspace %d (%s)\n", + s->in_csp, av_color_space_name(s->in_csp)); + return AVERROR(EINVAL); + } + redo_yuv2rgb = 1; + } + + if (!s->out_lumacoef) { + s->out_csp = out->colorspace; + s->out_rng = out->color_range; + s->out_lumacoef = get_luma_coefficients(s->out_csp); + if (!s->out_lumacoef) { + if (s->out_csp == AVCOL_SPC_UNSPECIFIED) { + if (s->user_all == CS_UNSPECIFIED) { + av_log(ctx, AV_LOG_ERROR, + "Please specify output transfer characteristics\n"); + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output color property %d\n", s->user_all); + } + } else { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output transfer characteristics %d (%s)\n", + s->out_csp, av_color_space_name(s->out_csp)); + } + return AVERROR(EINVAL); + } + redo_rgb2yuv = 1; + } + + fmt_identical = in_desc->log2_chroma_h == out_desc->log2_chroma_h && + in_desc->log2_chroma_w == out_desc->log2_chroma_w; + s->yuv2yuv_fastmode = s->rgb2rgb_passthrough && fmt_identical; + s->yuv2yuv_passthrough = s->yuv2yuv_fastmode && s->in_rng == s->out_rng && + !memcmp(s->in_lumacoef, s->out_lumacoef, + sizeof(*s->in_lumacoef)); + if (!s->yuv2yuv_passthrough) { + if (redo_yuv2rgb) { + double rgb2yuv[3][3], (*yuv2rgb)[3] = s->yuv2rgb_dbl_coeffs; + int off, bits, in_rng; + + res = get_range_off(&off, &s->in_y_rng, &s->in_uv_rng, + s->in_rng, in_desc->comp[0].depth); + if (res < 0) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported input color range %d (%s)\n", + s->in_rng, av_color_range_name(s->in_rng)); + return res; + } + for (n = 0; n < 8; n++) + s->yuv_offset[0][n] = off; + fill_rgb2yuv_table(s->in_lumacoef, rgb2yuv); + invert_matrix3x3(rgb2yuv, yuv2rgb); + bits = 1 << (in_desc->comp[0].depth - 1); + for (n = 0; n < 3; n++) { + for (in_rng = s->in_y_rng, m = 0; m < 3; m++, in_rng = s->in_uv_rng) { + s->yuv2rgb_coeffs[n][m][0] = lrint(28672 * bits * yuv2rgb[n][m] / in_rng); + for (o = 1; o < 8; o++) + s->yuv2rgb_coeffs[n][m][o] = s->yuv2rgb_coeffs[n][m][0]; + } + } + av_assert2(s->yuv2rgb_coeffs[0][1][0] == 0); + av_assert2(s->yuv2rgb_coeffs[2][2][0] == 0); + av_assert2(s->yuv2rgb_coeffs[0][0][0] == s->yuv2rgb_coeffs[1][0][0]); + av_assert2(s->yuv2rgb_coeffs[0][0][0] == s->yuv2rgb_coeffs[2][0][0]); + s->yuv2rgb = s->dsp.yuv2rgb[(in_desc->comp[0].depth - 8) >> 1] + [in_desc->log2_chroma_h + in_desc->log2_chroma_w]; + emms = 1; + } + + if (redo_rgb2yuv) { + double (*rgb2yuv)[3] = s->rgb2yuv_dbl_coeffs; + int off, out_rng, bits; + + res = get_range_off(&off, &s->out_y_rng, &s->out_uv_rng, + s->out_rng, out_desc->comp[0].depth); + if (res < 0) { + av_log(ctx, AV_LOG_ERROR, + "Unsupported output color range %d (%s)\n", + s->out_rng, av_color_range_name(s->out_rng)); + return res; + } + for (n = 0; n < 8; n++) + s->yuv_offset[1][n] = off; + fill_rgb2yuv_table(s->out_lumacoef, rgb2yuv); + bits = 1 << (29 - out_desc->comp[0].depth); + for (n = 0; n < 3; n++) { + for (out_rng = s->out_y_rng, m = 0; m < 3; m++, out_rng = s->out_uv_rng) { + s->rgb2yuv_coeffs[n][m][0] = lrint(bits * out_rng * rgb2yuv[n][m] / 28672); + for (o = 1; o < 8; o++) + s->rgb2yuv_coeffs[n][m][o] = s->rgb2yuv_coeffs[n][m][0]; + } + } + av_assert2(s->rgb2yuv_coeffs[1][2][0] == s->rgb2yuv_coeffs[2][0][0]); + s->rgb2yuv = s->dsp.rgb2yuv[(out_desc->comp[0].depth - 8) >> 1] + [out_desc->log2_chroma_h + out_desc->log2_chroma_w]; + emms = 1; + } + + if (s->yuv2yuv_fastmode && (redo_yuv2rgb || redo_rgb2yuv)) { + int idepth = in_desc->comp[0].depth, odepth = out_desc->comp[0].depth; + double (*rgb2yuv)[3] = s->rgb2yuv_dbl_coeffs; + double (*yuv2rgb)[3] = s->yuv2rgb_dbl_coeffs; + double yuv2yuv[3][3]; + int in_rng, out_rng; + + mul3x3(yuv2yuv, yuv2rgb, rgb2yuv); + for (out_rng = s->out_y_rng, m = 0; m < 3; m++, out_rng = s->out_uv_rng) { + for (in_rng = s->in_y_rng, n = 0; n < 3; n++, in_rng = s->in_uv_rng) { + s->yuv2yuv_coeffs[m][n][0] = + lrint(16384 * yuv2yuv[m][n] * out_rng * (1 << idepth) / + (in_rng * (1 << odepth))); + for (o = 1; o < 8; o++) + s->yuv2yuv_coeffs[m][n][o] = s->yuv2yuv_coeffs[m][n][0]; + } + } + av_assert2(s->yuv2yuv_coeffs[1][0][0] == 0); + av_assert2(s->yuv2yuv_coeffs[2][0][0] == 0); + s->yuv2yuv = s->dsp.yuv2yuv[(idepth - 8) >> 1][(odepth - 8) >> 1] + [in_desc->log2_chroma_h + in_desc->log2_chroma_w]; + } + } + + if (emms) + emms_c(); + + return 0; +} + +static int init(AVFilterContext *ctx) +{ + ColorSpaceContext *s = ctx->priv; + + ff_colorspacedsp_init(&s->dsp); + + return 0; +} + +static void uninit(AVFilterContext *ctx) +{ + ColorSpaceContext *s = ctx->priv; + + av_freep(&s->rgb[0]); + av_freep(&s->rgb[1]); + av_freep(&s->rgb[2]); + s->rgb_sz = 0; + + av_freep(&s->lin_lut); +} + +static int filter_frame(AVFilterLink *link, AVFrame *in) +{ + AVFilterContext *ctx = link->dst; + AVFilterLink *outlink = ctx->outputs[0]; + ColorSpaceContext *s = ctx->priv; + // FIXME if yuv2yuv_passthrough, don't get a new buffer but use the + // input one if it is writable *OR* the actual literal values of in_* + // and out_* are identical (not just their respective properties) + AVFrame *out = ff_get_video_buffer(outlink, outlink->w, outlink->h); + int res; + ptrdiff_t rgb_stride = FFALIGN(in->width * sizeof(int16_t), 32); + unsigned rgb_sz = rgb_stride * in->height; + struct ThreadData td; + + if (!out) { + av_frame_free(&in); + return AVERROR(ENOMEM); + } + av_frame_copy_props(out, in); + + out->color_primaries = s->user_prm == AVCOL_PRI_UNSPECIFIED ? + default_prm[FFMIN(s->user_all, CS_NB)] : s->user_prm; + if (s->user_trc == AVCOL_TRC_UNSPECIFIED) { + const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(out->format); + + out->color_trc = default_trc[FFMIN(s->user_all, CS_NB)]; + if (out->color_trc == AVCOL_TRC_BT2020_10 && desc && desc->comp[0].depth >= 12) + out->color_trc = AVCOL_TRC_BT2020_12; + } else { + out->color_trc = s->user_trc; + } + out->colorspace = s->user_csp == AVCOL_SPC_UNSPECIFIED ? + default_csp[FFMIN(s->user_all, CS_NB)] : s->user_csp; + out->color_range = s->user_rng == AVCOL_RANGE_UNSPECIFIED ? + in->color_range : s->user_rng; + if (rgb_sz != s->rgb_sz) { + av_freep(&s->rgb[0]); + av_freep(&s->rgb[1]); + av_freep(&s->rgb[2]); + s->rgb_sz = 0; + + s->rgb[0] = av_malloc(rgb_sz); + s->rgb[1] = av_malloc(rgb_sz); + s->rgb[2] = av_malloc(rgb_sz); + if (!s->rgb[0] || !s->rgb[1] || !s->rgb[2]) { + uninit(ctx); + return AVERROR(ENOMEM); + } + s->rgb_sz = rgb_sz; + } + res = create_filtergraph(ctx, in, out); + if (res < 0) + return res; + s->rgb_stride = rgb_stride / sizeof(int16_t); + td.in = in; + td.out = out; + td.in_linesize[0] = in->linesize[0]; + td.in_linesize[1] = in->linesize[1]; + td.in_linesize[2] = in->linesize[2]; + td.out_linesize[0] = out->linesize[0]; + td.out_linesize[1] = out->linesize[1]; + td.out_linesize[2] = out->linesize[2]; + td.in_ss_h = av_pix_fmt_desc_get(in->format)->log2_chroma_h; + td.out_ss_h = av_pix_fmt_desc_get(out->format)->log2_chroma_h; + if (s->yuv2yuv_passthrough) { + av_frame_copy(out, in); + } else { + ctx->internal->execute(ctx, convert, &td, NULL, + FFMIN((in->height + 1) >> 1, ctx->graph->nb_threads)); + } + av_frame_free(&in); + + return ff_filter_frame(outlink, out); +} + +static int query_formats(AVFilterContext *ctx) +{ + static const enum AVPixelFormat pix_fmts[] = { + AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUV444P, + AV_PIX_FMT_YUV420P10, AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV444P10, + AV_PIX_FMT_YUV420P12, AV_PIX_FMT_YUV422P12, AV_PIX_FMT_YUV444P12, + AV_PIX_FMT_NONE + }; + int res; + ColorSpaceContext *s = ctx->priv; + AVFilterFormats *formats = ff_make_format_list(pix_fmts); + + if (!formats) + return AVERROR(ENOMEM); + if (s->user_format == AV_PIX_FMT_NONE) + return ff_set_common_formats(ctx, formats); + res = ff_formats_ref(formats, &ctx->inputs[0]->out_formats); + if (res < 0) + return res; + formats = NULL; + res = ff_add_format(&formats, s->user_format); + if (res < 0) + return res; + + return ff_formats_ref(formats, &ctx->outputs[0]->in_formats); +} + +static int config_props(AVFilterLink *outlink) +{ + AVFilterLink *inlink = outlink->src->inputs[0]; + + outlink->w = inlink->w; + outlink->h = inlink->h; + outlink->sample_aspect_ratio = inlink->sample_aspect_ratio; + outlink->time_base = inlink->time_base; + + return 0; +} + +#define OFFSET(x) offsetof(ColorSpaceContext, x) +#define FLAGS AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM +#define ENUM(x, y, z) { x, "", 0, AV_OPT_TYPE_CONST, { .i64 = y }, INT_MIN, INT_MAX, FLAGS, z } + +static const AVOption colorspace_options[] = { + { "all", "Set all color properties together", + OFFSET(user_all), AV_OPT_TYPE_INT, { .i64 = CS_UNSPECIFIED }, + CS_UNSPECIFIED, CS_NB - 1, FLAGS, "all" }, + ENUM("bt470m", CS_BT470M, "all"), + ENUM("bt470bg", CS_BT470BG, "all"), + ENUM("bt601-6-525", CS_BT601_6_525, "all"), + ENUM("bt601-6-625", CS_BT601_6_625, "all"), + ENUM("bt709", CS_BT709, "all"), + ENUM("smpte170m", CS_SMPTE170M, "all"), + ENUM("smpte240m", CS_SMPTE240M, "all"), + ENUM("bt2020", CS_BT2020, "all"), + + { "space", "Output colorspace", + OFFSET(user_csp), AV_OPT_TYPE_INT, { .i64 = AVCOL_SPC_UNSPECIFIED }, + AVCOL_PRI_RESERVED0, AVCOL_PRI_NB - 1, FLAGS, "csp" }, + ENUM("bt709", AVCOL_SPC_BT709, "csp"), + ENUM("fcc", AVCOL_SPC_FCC, "csp"), + ENUM("bt470bg", AVCOL_SPC_BT470BG, "csp"), + ENUM("smpte170m", AVCOL_SPC_SMPTE170M, "csp"), + ENUM("smpte240m", AVCOL_SPC_SMPTE240M, "csp"), + ENUM("bt2020ncl", AVCOL_SPC_BT2020_NCL, "csp"), + + { "range", "Output color range", + OFFSET(user_rng), AV_OPT_TYPE_INT, { .i64 = AVCOL_RANGE_UNSPECIFIED }, + AVCOL_RANGE_UNSPECIFIED, AVCOL_RANGE_NB - 1, FLAGS, "rng" }, + ENUM("mpeg", AVCOL_RANGE_MPEG, "rng"), + ENUM("jpeg", AVCOL_RANGE_JPEG, "rng"), + + { "primaries", "Output color primaries", + OFFSET(user_prm), AV_OPT_TYPE_INT, { .i64 = AVCOL_PRI_UNSPECIFIED }, + AVCOL_PRI_RESERVED0, AVCOL_PRI_NB - 1, FLAGS, "prm" }, + ENUM("bt709", AVCOL_PRI_BT709, "prm"), + ENUM("bt470m", AVCOL_PRI_BT470M, "prm"), + ENUM("bt470bg", AVCOL_PRI_BT470BG, "prm"), + ENUM("smpte170m", AVCOL_PRI_SMPTE170M, "prm"), + ENUM("smpte240m", AVCOL_PRI_SMPTE240M, "prm"), + ENUM("bt2020", AVCOL_PRI_BT2020, "prm"), + + { "trc", "Output transfer characteristics", + OFFSET(user_trc), AV_OPT_TYPE_INT, { .i64 = AVCOL_TRC_UNSPECIFIED }, + AVCOL_TRC_RESERVED0, AVCOL_TRC_NB - 1, FLAGS, "trc" }, + ENUM("bt709", AVCOL_TRC_BT709, "trc"), + ENUM("gamma22", AVCOL_TRC_GAMMA22, "trc"), + ENUM("gamma28", AVCOL_TRC_GAMMA28, "trc"), + ENUM("smpte170m", AVCOL_TRC_SMPTE170M, "trc"), + ENUM("smpte240m", AVCOL_TRC_SMPTE240M, "trc"), + ENUM("bt2020-10", AVCOL_TRC_BT2020_10, "trc"), + ENUM("bt2020-12", AVCOL_TRC_BT2020_12, "trc"), + + { "format", "Output pixel format", + OFFSET(user_format), AV_OPT_TYPE_INT, { .i64 = AV_PIX_FMT_NONE }, + AV_PIX_FMT_NONE, AV_PIX_FMT_GBRAP12LE, FLAGS, "fmt" }, + ENUM("yuv420p", AV_PIX_FMT_YUV420P, "fmt"), + ENUM("yuv420p10", AV_PIX_FMT_YUV420P10, "fmt"), + ENUM("yuv420p12", AV_PIX_FMT_YUV420P12, "fmt"), + ENUM("yuv422p", AV_PIX_FMT_YUV422P, "fmt"), + ENUM("yuv422p10", AV_PIX_FMT_YUV422P10, "fmt"), + ENUM("yuv422p12", AV_PIX_FMT_YUV422P12, "fmt"), + ENUM("yuv444p", AV_PIX_FMT_YUV444P, "fmt"), + ENUM("yuv444p10", AV_PIX_FMT_YUV444P10, "fmt"), + ENUM("yuv444p12", AV_PIX_FMT_YUV444P12, "fmt"), + + { "fast", "Ignore primary chromaticity and gamma correction", + OFFSET(fast_mode), AV_OPT_TYPE_BOOL, { .i64 = 0 }, + 0, 1, FLAGS }, + { NULL } +}; + +AVFILTER_DEFINE_CLASS(colorspace); + +static const AVFilterPad inputs[] = { + { + .name = "default", + .type = AVMEDIA_TYPE_VIDEO, + .filter_frame = filter_frame, + }, + { NULL } +}; + +static const AVFilterPad outputs[] = { + { + .name = "default", + .type = AVMEDIA_TYPE_VIDEO, + .config_props = config_props, + }, + { NULL } +}; + +AVFilter ff_vf_colorspace = { + .name = "colorspace", + .description = NULL_IF_CONFIG_SMALL("Convert between colorspaces."), + .init = init, + .uninit = uninit, + .query_formats = query_formats, + .priv_size = sizeof(ColorSpaceContext), + .priv_class = &colorspace_class, + .inputs = inputs, + .outputs = outputs, + .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC | AVFILTER_FLAG_SLICE_THREADS, +}; -- cgit v1.2.3