212 lines
		
	
	
		
			7.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			212 lines
		
	
	
		
			7.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */
 | |
| 
 | |
| #include <string.h>
 | |
| 
 | |
| #include "libavutil/common.h"
 | |
| #include "libavutil/intreadwrite.h"
 | |
| #include "libavutil/mem_internal.h"
 | |
| #include "libavutil/pixdesc.h"
 | |
| 
 | |
| #include "libswscale/swscale.h"
 | |
| #include "libswscale/swscale_internal.h"
 | |
| 
 | |
| #include "checkasm.h"
 | |
| 
 | |
/*
 * Fill buf[0 .. size) with values returned by rnd(), one 32-bit store at a
 * time. A 4-byte store is issued at every offset j < size (j = 0, 4, 8, ...),
 * so size should be a multiple of 4; otherwise the last store runs past size.
 *
 * Both arguments are parenthesized in the expansion so that compound
 * expressions (e.g. "cond ? a : b" or "ptr + off") are evaluated as a unit.
 */
#define randomize_buffers(buf, size)        \
    do {                                    \
        for (int j = 0; j < (size); j += 4) \
            AV_WN32((buf) + j, rnd());      \
    } while (0)
 | |
| 
 | |
| static const int dst_fmts[] = {
 | |
| //     AV_PIX_FMT_BGR48BE,
 | |
| //     AV_PIX_FMT_BGR48LE,
 | |
| //     AV_PIX_FMT_RGB48BE,
 | |
| //     AV_PIX_FMT_RGB48LE,
 | |
|     AV_PIX_FMT_ARGB,
 | |
|     AV_PIX_FMT_ABGR,
 | |
|     AV_PIX_FMT_RGBA,
 | |
|     AV_PIX_FMT_BGRA,
 | |
|     AV_PIX_FMT_RGB24,
 | |
|     AV_PIX_FMT_BGR24,
 | |
|     AV_PIX_FMT_RGB565,
 | |
|     AV_PIX_FMT_BGR565,
 | |
|     AV_PIX_FMT_RGB555,
 | |
|     AV_PIX_FMT_BGR555,
 | |
| //     AV_PIX_FMT_RGB444,
 | |
| //     AV_PIX_FMT_BGR444,
 | |
| //     AV_PIX_FMT_RGB8,
 | |
| //     AV_PIX_FMT_BGR8,
 | |
| //     AV_PIX_FMT_RGB4,
 | |
| //     AV_PIX_FMT_BGR4,
 | |
| //     AV_PIX_FMT_RGB4_BYTE,
 | |
| //     AV_PIX_FMT_BGR4_BYTE,
 | |
| //     AV_PIX_FMT_MONOBLACK,
 | |
| };
 | |
| 
 | |
/**
 * Byte-wise comparison with a tolerance.
 *
 * @param ref      reference bytes
 * @param test     bytes under test
 * @param n        number of bytes to compare
 * @param accuracy largest absolute per-byte difference that is accepted
 * @return 1 if any byte pair differs by more than accuracy, 0 otherwise
 */
static int cmp_off_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
{
    const uint8_t *const ref_end = ref + n;

    while (ref < ref_end) {
        // Both operands promote to int, so delta lies in [-255, 255].
        const int delta = *ref++ - *test++;

        if (delta > accuracy || -delta > accuracy)
            return 1;
    }

    return 0;
}
 | |
| 
 | |
/**
 * Compare two lines of native-endian 16-bit pixels, treating each pixel as
 * three 5-bit fields at bit offsets 0, 5 and 10 (bit 15 is ignored).
 *
 * Pixels are loaded with memcpy() rather than through a cast uint16_t
 * pointer, so the byte buffers need no particular alignment and no
 * effective-type (strict aliasing) rule is violated.
 *
 * @param ref      reference pixels, 2 bytes each
 * @param test     pixels under test, 2 bytes each
 * @param n        number of pixels (not bytes) to compare
 * @param accuracy largest absolute per-field difference that is accepted
 * @return 1 if any field differs by more than accuracy, 0 otherwise
 */
static int cmp_555_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
{
    for (size_t i = 0; i < n; i++) {
        uint16_t ref_px, test_px;

        memcpy(&ref_px,  ref  + 2 * i, sizeof(ref_px));
        memcpy(&test_px, test + 2 * i, sizeof(test_px));

        for (int shift = 0; shift <= 10; shift += 5) {
            const int ref_field  = (ref_px  >> shift) & 0x1f;
            const int test_field = (test_px >> shift) & 0x1f;

            if (abs(ref_field - test_field) > accuracy)
                return 1;
        }
    }
    return 0;
}
 | |
| 
 | |
/**
 * Compare two lines of native-endian 16-bit pixels, treating each pixel as
 * a 5-bit field at bit 0, a 6-bit field at bit 5 and a 5-bit field at bit 11.
 *
 * Pixels are loaded with memcpy() rather than through a cast uint16_t
 * pointer, so the byte buffers need no particular alignment and no
 * effective-type (strict aliasing) rule is violated.
 *
 * @param ref      reference pixels, 2 bytes each
 * @param test     pixels under test, 2 bytes each
 * @param n        number of pixels (not bytes) to compare
 * @param accuracy largest absolute per-field difference that is accepted
 * @return 1 if any field differs by more than accuracy, 0 otherwise
 */
static int cmp_565_by_n(const uint8_t *ref, const uint8_t *test, size_t n, int accuracy)
{
    for (size_t i = 0; i < n; i++) {
        uint16_t ref_px, test_px;

        memcpy(&ref_px,  ref  + 2 * i, sizeof(ref_px));
        memcpy(&test_px, test + 2 * i, sizeof(test_px));

        if (abs(( ref_px        & 0x1f) - ( test_px        & 0x1f)) > accuracy)
            return 1;
        if (abs(((ref_px >>  5) & 0x3f) - ((test_px >>  5) & 0x3f)) > accuracy)
            return 1;
        if (abs(((ref_px >> 11) & 0x1f) - ((test_px >> 11) & 0x1f)) > accuracy)
            return 1;
    }
    return 0;
}
 | |
| 
 | |
| static void check_yuv2rgb(int src_pix_fmt)
 | |
| {
 | |
|     const AVPixFmtDescriptor *src_desc = av_pix_fmt_desc_get(src_pix_fmt);
 | |
| #define MAX_LINE_SIZE 1920
 | |
|     static const int input_sizes[] = {8, 128, 1080, MAX_LINE_SIZE};
 | |
| 
 | |
|     declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT,
 | |
|                       int, SwsContext *c, const uint8_t *src[],
 | |
|                            int srcStride[], int srcSliceY, int srcSliceH,
 | |
|                            uint8_t *dst[], int dstStride[]);
 | |
| 
 | |
|     LOCAL_ALIGNED_8(uint8_t, src_y, [MAX_LINE_SIZE * 2]);
 | |
|     LOCAL_ALIGNED_8(uint8_t, src_u, [MAX_LINE_SIZE]);
 | |
|     LOCAL_ALIGNED_8(uint8_t, src_v, [MAX_LINE_SIZE]);
 | |
|     LOCAL_ALIGNED_8(uint8_t, src_a, [MAX_LINE_SIZE * 2]);
 | |
|     const uint8_t *src[4] = { src_y, src_u, src_v, src_a };
 | |
| 
 | |
|     LOCAL_ALIGNED_8(uint8_t, dst0_, [2 * MAX_LINE_SIZE * 6]);
 | |
|     uint8_t *dst0[4] = { dst0_ };
 | |
|     uint8_t *lines0[2] = { dst0_, dst0_ + MAX_LINE_SIZE * 6 };
 | |
| 
 | |
|     LOCAL_ALIGNED_8(uint8_t, dst1_, [2 * MAX_LINE_SIZE * 6]);
 | |
|     uint8_t *dst1[4] = { dst1_ };
 | |
|     uint8_t *lines1[2] = { dst1_, dst1_ + MAX_LINE_SIZE * 6 };
 | |
| 
 | |
|     randomize_buffers(src_y, MAX_LINE_SIZE * 2);
 | |
|     randomize_buffers(src_u, MAX_LINE_SIZE);
 | |
|     randomize_buffers(src_v, MAX_LINE_SIZE);
 | |
|     randomize_buffers(src_a, MAX_LINE_SIZE * 2);
 | |
| 
 | |
|     for (int dfi = 0; dfi < FF_ARRAY_ELEMS(dst_fmts); dfi++) {
 | |
|         int dst_pix_fmt = dst_fmts[dfi];
 | |
|         const AVPixFmtDescriptor *dst_desc = av_pix_fmt_desc_get(dst_pix_fmt);
 | |
|         int sample_size = av_get_padded_bits_per_pixel(dst_desc) >> 3;
 | |
|         for (int isi = 0; isi < FF_ARRAY_ELEMS(input_sizes); isi++) {
 | |
|             struct SwsContext *ctx;
 | |
|             int log_level;
 | |
|             int width = input_sizes[isi];
 | |
|             int srcSliceY = 0;
 | |
|             int srcSliceH = 2;
 | |
|             int srcStride[4] = {
 | |
|                 width,
 | |
|                 width >> src_desc->log2_chroma_w,
 | |
|                 width >> src_desc->log2_chroma_w,
 | |
|                 width,
 | |
|             };
 | |
|             int dstStride[4] = { MAX_LINE_SIZE * 6 };
 | |
| 
 | |
|             // override log level to prevent spamming of the message
 | |
|             // "No accelerated colorspace conversion found from %s to %s"
 | |
|             log_level = av_log_get_level();
 | |
|             av_log_set_level(AV_LOG_ERROR);
 | |
|             ctx = sws_getContext(width, srcSliceH, src_pix_fmt,
 | |
|                                  width, srcSliceH, dst_pix_fmt,
 | |
|                                  0, NULL, NULL, NULL);
 | |
|             av_log_set_level(log_level);
 | |
|             if (!ctx)
 | |
|                 fail();
 | |
| 
 | |
|             if (check_func(ctx->convert_unscaled, "%s_%s_%d", src_desc->name, dst_desc->name, width)) {
 | |
|                 memset(dst0_, 0xFF, 2 * MAX_LINE_SIZE * 6);
 | |
|                 memset(dst1_, 0xFF, 2 * MAX_LINE_SIZE * 6);
 | |
| 
 | |
|                 call_ref(ctx, src, srcStride, srcSliceY,
 | |
|                          srcSliceH, dst0, dstStride);
 | |
|                 call_new(ctx, src, srcStride, srcSliceY,
 | |
|                          srcSliceH, dst1, dstStride);
 | |
| 
 | |
|                 if (dst_pix_fmt == AV_PIX_FMT_ARGB  ||
 | |
|                     dst_pix_fmt == AV_PIX_FMT_ABGR  ||
 | |
|                     dst_pix_fmt == AV_PIX_FMT_RGBA  ||
 | |
|                     dst_pix_fmt == AV_PIX_FMT_BGRA  ||
 | |
|                     dst_pix_fmt == AV_PIX_FMT_RGB24 ||
 | |
|                     dst_pix_fmt == AV_PIX_FMT_BGR24) {
 | |
|                     if (cmp_off_by_n(lines0[0], lines1[0], width * sample_size, 3) ||
 | |
|                         cmp_off_by_n(lines0[1], lines1[1], width * sample_size, 3))
 | |
|                         fail();
 | |
|                 } else if (dst_pix_fmt == AV_PIX_FMT_RGB565 ||
 | |
|                            dst_pix_fmt == AV_PIX_FMT_BGR565) {
 | |
|                     if (cmp_565_by_n(lines0[0], lines1[0], width, 2) ||
 | |
|                         cmp_565_by_n(lines0[1], lines1[1], width, 2))
 | |
|                         fail();
 | |
|                 } else if (dst_pix_fmt == AV_PIX_FMT_RGB555 ||
 | |
|                            dst_pix_fmt == AV_PIX_FMT_BGR555) {
 | |
|                     if (cmp_555_by_n(lines0[0], lines1[0], width, 2) ||
 | |
|                         cmp_555_by_n(lines0[1], lines1[1], width, 2))
 | |
|                         fail();
 | |
|                 } else {
 | |
|                     fail();
 | |
|                 }
 | |
| 
 | |
|                 bench_new(ctx, src, srcStride, srcSliceY,
 | |
|                           srcSliceH, dst0, dstStride);
 | |
|             }
 | |
|             sws_freeContext(ctx);
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| #undef MAX_LINE_SIZE
 | |
| 
 | |
| void checkasm_check_sw_yuv2rgb(void)
 | |
| {
 | |
|     check_yuv2rgb(AV_PIX_FMT_YUV420P);
 | |
|     report("yuv420p");
 | |
|     check_yuv2rgb(AV_PIX_FMT_YUV422P);
 | |
|     report("yuv422p");
 | |
|     check_yuv2rgb(AV_PIX_FMT_YUVA420P);
 | |
|     report("yuva420p");
 | |
| }
 |