add sad_32x32 in pixelutils API, and update the fate. Signed-off-by: Jun Zhao <mypopydev@gmail.com>
		
			
				
	
	
		
			90 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			90 lines
		
	
	
		
			2.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * This file is part of FFmpeg.
 | |
|  *
 | |
|  * FFmpeg is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2.1 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * FFmpeg is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with FFmpeg; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | |
|  */
 | |
| 
 | |
| #include "config.h"
 | |
| #include "common.h"
 | |
| #include "pixelutils.h"
 | |
| #include "internal.h"
 | |
| 
 | |
| #if CONFIG_PIXELUTILS
 | |
| 
 | |
| #include "x86/pixelutils.h"
 | |
| 
 | |
| static av_always_inline int sad_wxh(const uint8_t *src1, ptrdiff_t stride1,
 | |
|                                     const uint8_t *src2, ptrdiff_t stride2,
 | |
|                                     int w, int h)
 | |
| {
 | |
|     int x, y, sum = 0;
 | |
| 
 | |
|     for (y = 0; y < h; y++) {
 | |
|         for (x = 0; x < w; x++)
 | |
|             sum += abs(src1[x] - src2[x]);
 | |
|         src1 += stride1;
 | |
|         src2 += stride2;
 | |
|     }
 | |
|     return sum;
 | |
| }
 | |
| 
 | |
| #define DECLARE_BLOCK_FUNCTIONS(size)                                               \
 | |
| static int block_sad_##size##x##size##_c(const uint8_t *src1, ptrdiff_t stride1,    \
 | |
|                                          const uint8_t *src2, ptrdiff_t stride2)    \
 | |
| {                                                                                   \
 | |
|     return sad_wxh(src1, stride1, src2, stride2, size, size);                       \
 | |
| }
 | |
| 
 | |
| DECLARE_BLOCK_FUNCTIONS(2)
 | |
| DECLARE_BLOCK_FUNCTIONS(4)
 | |
| DECLARE_BLOCK_FUNCTIONS(8)
 | |
| DECLARE_BLOCK_FUNCTIONS(16)
 | |
| DECLARE_BLOCK_FUNCTIONS(32)
 | |
| 
 | |
| static const av_pixelutils_sad_fn sad_c[] = {
 | |
|     block_sad_2x2_c,
 | |
|     block_sad_4x4_c,
 | |
|     block_sad_8x8_c,
 | |
|     block_sad_16x16_c,
 | |
|     block_sad_32x32_c,
 | |
| };
 | |
| 
 | |
| #endif /* CONFIG_PIXELUTILS */
 | |
| 
 | |
| av_pixelutils_sad_fn av_pixelutils_get_sad_fn(int w_bits, int h_bits, int aligned, void *log_ctx)
 | |
| {
 | |
| #if !CONFIG_PIXELUTILS
 | |
|     av_log(log_ctx, AV_LOG_ERROR, "pixelutils support is required "
 | |
|            "but libavutil is not compiled with it\n");
 | |
|     return NULL;
 | |
| #else
 | |
|     av_pixelutils_sad_fn sad[FF_ARRAY_ELEMS(sad_c)];
 | |
| 
 | |
|     memcpy(sad, sad_c, sizeof(sad));
 | |
| 
 | |
|     if (w_bits < 1 || w_bits > FF_ARRAY_ELEMS(sad) ||
 | |
|         h_bits < 1 || h_bits > FF_ARRAY_ELEMS(sad))
 | |
|         return NULL;
 | |
|     if (w_bits != h_bits) // only squared sad for now
 | |
|         return NULL;
 | |
| 
 | |
| #if ARCH_X86
 | |
|     ff_pixelutils_sad_init_x86(sad, aligned);
 | |
| #endif
 | |
| 
 | |
|     return sad[w_bits - 1];
 | |
| #endif
 | |
| }
 |