mirror of
https://github.com/librempeg/librempeg
synced 2024-11-22 00:51:37 +00:00
7d8a5e3aee
And preserve the public SwsContext as separate name. The motivation here is that I want to turn SwsContext into a public struct, while keeping the internal implementation hidden. Additionally, I also want to be able to use multiple internal implementations, e.g. for GPU devices. This commit does not include any functional changes. For the most part, it is a simple rename. The only complications arise from the public facing API functions, which preserve their current type (and hence require an additional unwrapping step internally), and the checkasm test framework, which directly accesses SwsInternal. For consistency, the affected functions that need to maintain a distionction have generally been changed to refer to the SwsContext as *sws, and the SwsInternal as *c. In an upcoming commit, I will provide a backing definition for the public SwsContext, and update `sws_internal()` to dereference the internal struct instead of merely casting it. Sponsored-by: Sovereign Tech Fund Signed-off-by: Niklas Haas <git@haasn.dev> Signed-off-by: Paul B Mahol <onemda@gmail.com>
242 lines
8.8 KiB
C
242 lines
8.8 KiB
C
/*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with FFmpeg; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*/
|
|
|
|
#include <string.h>
|
|
|
|
#include "libavutil/common.h"
|
|
#include "libavutil/intreadwrite.h"
|
|
#include "libavutil/mem_internal.h"
|
|
#include "libavutil/pixdesc.h"
|
|
|
|
#include "libswscale/swscale.h"
|
|
#include "libswscale/swscale_internal.h"
|
|
|
|
#include "checkasm.h"
|
|
|
|
#define randomize_buffers(buf, size) \
|
|
do { \
|
|
for (int j = 0; j < size; j += 4) \
|
|
AV_WN32(buf + j, rnd()); \
|
|
} while (0)
|
|
|
|
static const int dst_fmts[] = {
|
|
// AV_PIX_FMT_BGR48BE,
|
|
// AV_PIX_FMT_BGR48LE,
|
|
// AV_PIX_FMT_RGB48BE,
|
|
// AV_PIX_FMT_RGB48LE,
|
|
AV_PIX_FMT_ARGB,
|
|
AV_PIX_FMT_ABGR,
|
|
AV_PIX_FMT_RGBA,
|
|
AV_PIX_FMT_BGRA,
|
|
AV_PIX_FMT_RGB24,
|
|
AV_PIX_FMT_BGR24,
|
|
AV_PIX_FMT_RGB565,
|
|
AV_PIX_FMT_BGR565,
|
|
AV_PIX_FMT_RGB555,
|
|
AV_PIX_FMT_BGR555,
|
|
// AV_PIX_FMT_RGB444,
|
|
// AV_PIX_FMT_BGR444,
|
|
// AV_PIX_FMT_RGB8,
|
|
// AV_PIX_FMT_BGR8,
|
|
// AV_PIX_FMT_RGB4,
|
|
// AV_PIX_FMT_BGR4,
|
|
// AV_PIX_FMT_RGB4_BYTE,
|
|
// AV_PIX_FMT_BGR4_BYTE,
|
|
// AV_PIX_FMT_MONOBLACK,
|
|
AV_PIX_FMT_GBRP,
|
|
};
|
|
|
|
static int cmp_off_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
|
|
{
|
|
for (size_t i = 0; i < n; i++) {
|
|
if (abs(ref[i] - test[i]) > accuracy)
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int cmp_555_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
|
|
{
|
|
const uint16_t *ref16 = (const uint16_t *) ref;
|
|
const uint16_t *test16 = (const uint16_t *) test;
|
|
for (size_t i = 0; i < n; i++) {
|
|
if (abs(( ref16[i] & 0x1f) - ( test16[i] & 0x1f)) > accuracy)
|
|
return 1;
|
|
if (abs(((ref16[i] >> 5) & 0x1f) - ((test16[i] >> 5) & 0x1f)) > accuracy)
|
|
return 1;
|
|
if (abs(((ref16[i] >> 10) & 0x1f) - ((test16[i] >> 10) & 0x1f)) > accuracy)
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int cmp_565_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
|
|
{
|
|
const uint16_t *ref16 = (const uint16_t *) ref;
|
|
const uint16_t *test16 = (const uint16_t *) test;
|
|
for (size_t i = 0; i < n; i++) {
|
|
if (abs(( ref16[i] & 0x1f) - ( test16[i] & 0x1f)) > accuracy)
|
|
return 1;
|
|
if (abs(((ref16[i] >> 5) & 0x3f) - ((test16[i] >> 5) & 0x3f)) > accuracy)
|
|
return 1;
|
|
if (abs(((ref16[i] >> 11) & 0x1f) - ((test16[i] >> 11) & 0x1f)) > accuracy)
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static void check_yuv2rgb(int src_pix_fmt)
|
|
{
|
|
const AVPixFmtDescriptor *src_desc = av_pix_fmt_desc_get(src_pix_fmt);
|
|
#define MAX_LINE_SIZE 1920
|
|
static const int input_sizes[] = {8, 128, 1080, MAX_LINE_SIZE};
|
|
|
|
declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT,
|
|
int, SwsInternal *c, const uint8_t *src[],
|
|
int srcStride[], int srcSliceY, int srcSliceH,
|
|
uint8_t *dst[], int dstStride[]);
|
|
|
|
LOCAL_ALIGNED_8(uint8_t, src_y, [MAX_LINE_SIZE * 2]);
|
|
LOCAL_ALIGNED_8(uint8_t, src_u, [MAX_LINE_SIZE]);
|
|
LOCAL_ALIGNED_8(uint8_t, src_v, [MAX_LINE_SIZE]);
|
|
LOCAL_ALIGNED_8(uint8_t, src_a, [MAX_LINE_SIZE * 2]);
|
|
const uint8_t *src[4] = { src_y, src_u, src_v, src_a };
|
|
|
|
LOCAL_ALIGNED_8(uint8_t, dst0_0, [2 * MAX_LINE_SIZE * 6]);
|
|
LOCAL_ALIGNED_8(uint8_t, dst0_1, [2 * MAX_LINE_SIZE]);
|
|
LOCAL_ALIGNED_8(uint8_t, dst0_2, [2 * MAX_LINE_SIZE]);
|
|
uint8_t *dst0[4] = { dst0_0, dst0_1, dst0_2 };
|
|
uint8_t *lines0[4][2] = {
|
|
{ dst0_0, dst0_0 + MAX_LINE_SIZE * 6 },
|
|
{ dst0_1, dst0_1 + MAX_LINE_SIZE },
|
|
{ dst0_2, dst0_2 + MAX_LINE_SIZE }
|
|
};
|
|
|
|
LOCAL_ALIGNED_8(uint8_t, dst1_0, [2 * MAX_LINE_SIZE * 6]);
|
|
LOCAL_ALIGNED_8(uint8_t, dst1_1, [2 * MAX_LINE_SIZE]);
|
|
LOCAL_ALIGNED_8(uint8_t, dst1_2, [2 * MAX_LINE_SIZE]);
|
|
uint8_t *dst1[4] = { dst1_0, dst1_1, dst1_2 };
|
|
uint8_t *lines1[4][2] = {
|
|
{ dst1_0, dst1_0 + MAX_LINE_SIZE * 6 },
|
|
{ dst1_1, dst1_1 + MAX_LINE_SIZE },
|
|
{ dst1_2, dst1_2 + MAX_LINE_SIZE }
|
|
};
|
|
|
|
randomize_buffers(src_y, MAX_LINE_SIZE * 2);
|
|
randomize_buffers(src_u, MAX_LINE_SIZE);
|
|
randomize_buffers(src_v, MAX_LINE_SIZE);
|
|
randomize_buffers(src_a, MAX_LINE_SIZE * 2);
|
|
|
|
for (int dfi = 0; dfi < FF_ARRAY_ELEMS(dst_fmts); dfi++) {
|
|
int dst_pix_fmt = dst_fmts[dfi];
|
|
const AVPixFmtDescriptor *dst_desc = av_pix_fmt_desc_get(dst_pix_fmt);
|
|
int sample_size = av_get_padded_bits_per_pixel(dst_desc) >> 3;
|
|
for (int isi = 0; isi < FF_ARRAY_ELEMS(input_sizes); isi++) {
|
|
SwsContext *sws;
|
|
SwsInternal *c;
|
|
int log_level;
|
|
int width = input_sizes[isi];
|
|
int srcSliceY = 0;
|
|
int srcSliceH = 2;
|
|
int srcStride[4] = {
|
|
width,
|
|
width >> src_desc->log2_chroma_w,
|
|
width >> src_desc->log2_chroma_w,
|
|
width,
|
|
};
|
|
int dstStride[4] = {
|
|
MAX_LINE_SIZE * 6,
|
|
MAX_LINE_SIZE,
|
|
MAX_LINE_SIZE,
|
|
};
|
|
|
|
// override log level to prevent spamming of the message
|
|
// "No accelerated colorspace conversion found from %s to %s"
|
|
log_level = av_log_get_level();
|
|
av_log_set_level(AV_LOG_ERROR);
|
|
sws = sws_getContext(width, srcSliceH, src_pix_fmt,
|
|
width, srcSliceH, dst_pix_fmt,
|
|
0, NULL, NULL, NULL);
|
|
av_log_set_level(log_level);
|
|
if (!sws)
|
|
fail();
|
|
|
|
c = sws_internal(sws);
|
|
if (check_func(c->convert_unscaled, "%s_%s_%d", src_desc->name, dst_desc->name, width)) {
|
|
memset(dst0_0, 0xFF, 2 * MAX_LINE_SIZE * 6);
|
|
memset(dst1_0, 0xFF, 2 * MAX_LINE_SIZE * 6);
|
|
if (dst_pix_fmt == AV_PIX_FMT_GBRP) {
|
|
memset(dst0_1, 0xFF, MAX_LINE_SIZE);
|
|
memset(dst0_2, 0xFF, MAX_LINE_SIZE);
|
|
memset(dst1_1, 0xFF, MAX_LINE_SIZE);
|
|
memset(dst1_2, 0xFF, MAX_LINE_SIZE);
|
|
}
|
|
|
|
call_ref(c, src, srcStride, srcSliceY,
|
|
srcSliceH, dst0, dstStride);
|
|
call_new(c, src, srcStride, srcSliceY,
|
|
srcSliceH, dst1, dstStride);
|
|
|
|
if (dst_pix_fmt == AV_PIX_FMT_ARGB ||
|
|
dst_pix_fmt == AV_PIX_FMT_ABGR ||
|
|
dst_pix_fmt == AV_PIX_FMT_RGBA ||
|
|
dst_pix_fmt == AV_PIX_FMT_BGRA ||
|
|
dst_pix_fmt == AV_PIX_FMT_RGB24 ||
|
|
dst_pix_fmt == AV_PIX_FMT_BGR24) {
|
|
if (cmp_off_by_n(lines0[0][0], lines1[0][0], width * sample_size, 3) ||
|
|
cmp_off_by_n(lines0[0][1], lines1[0][1], width * sample_size, 3))
|
|
fail();
|
|
} else if (dst_pix_fmt == AV_PIX_FMT_RGB565 ||
|
|
dst_pix_fmt == AV_PIX_FMT_BGR565) {
|
|
if (cmp_565_by_n(lines0[0][0], lines1[0][0], width, 2) ||
|
|
cmp_565_by_n(lines0[0][1], lines1[0][1], width, 2))
|
|
fail();
|
|
} else if (dst_pix_fmt == AV_PIX_FMT_RGB555 ||
|
|
dst_pix_fmt == AV_PIX_FMT_BGR555) {
|
|
if (cmp_555_by_n(lines0[0][0], lines1[0][0], width, 2) ||
|
|
cmp_555_by_n(lines0[0][1], lines1[0][1], width, 2))
|
|
fail();
|
|
} else if (dst_pix_fmt == AV_PIX_FMT_GBRP) {
|
|
for (int p = 0; p < 3; p++)
|
|
for (int l = 0; l < 2; l++)
|
|
if (cmp_off_by_n(lines0[p][l], lines1[p][l], width, 3))
|
|
fail();
|
|
} else {
|
|
fail();
|
|
}
|
|
|
|
bench_new(c, src, srcStride, srcSliceY,
|
|
srcSliceH, dst0, dstStride);
|
|
}
|
|
sws_freeContext(sws);
|
|
}
|
|
}
|
|
}
|
|
|
|
#undef MAX_LINE_SIZE
|
|
|
|
void checkasm_check_sw_yuv2rgb(void)
|
|
{
|
|
check_yuv2rgb(AV_PIX_FMT_YUV420P);
|
|
report("yuv420p");
|
|
check_yuv2rgb(AV_PIX_FMT_YUV422P);
|
|
report("yuv422p");
|
|
check_yuv2rgb(AV_PIX_FMT_YUVA420P);
|
|
report("yuva420p");
|
|
}
|