x86: Update x86inc.asm
Make things up-to-date with upstream. https://code.videolan.org/videolan/x86inc.asm
This commit is contained in:
		
							parent
							
								
									782c4df28d
								
							
						
					
					
						commit
						afa471d0ef
					
				
							
								
								
									
										4
									
								
								configure
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										4
									
								
								configure
									
									
									
									
										vendored
									
									
								
							| @ -2222,7 +2222,6 @@ ARCH_EXT_LIST_RISCV=" | ||||
| 
 | ||||
| ARCH_EXT_LIST_X86=" | ||||
|     $ARCH_EXT_LIST_X86_SIMD | ||||
|     cpunop | ||||
|     i686 | ||||
| " | ||||
| 
 | ||||
| @ -2771,7 +2770,6 @@ mipsdsp_deps="mips" | ||||
| mipsdspr2_deps="mips" | ||||
| msa_deps="mipsfpu" | ||||
| 
 | ||||
| cpunop_deps="i686" | ||||
| x86_64_select="i686" | ||||
| x86_64_suggest="fast_cmov" | ||||
| 
 | ||||
| @ -6401,7 +6399,6 @@ EOF | ||||
|         done | ||||
|         disabled x86asm && die "nasm/yasm not found or too old. Use --disable-x86asm for a crippled build." | ||||
|         X86ASMFLAGS="-f $objformat" | ||||
|         enabled pic               && append X86ASMFLAGS "-DPIC" | ||||
|         test -n "$extern_prefix"  && append X86ASMFLAGS "-DPREFIX" | ||||
|         case "$objformat" in | ||||
|             elf*) enabled debug && append X86ASMFLAGS $x86asm_debug ;; | ||||
| @ -6412,7 +6409,6 @@ EOF | ||||
|         enabled avx2      && check_x86asm avx2_external      "vextracti128 xmm0, ymm0, 0" | ||||
|         enabled xop       && check_x86asm xop_external       "vpmacsdd xmm0, xmm1, xmm2, xmm3" | ||||
|         enabled fma4      && check_x86asm fma4_external      "vfmaddps ymm0, ymm1, ymm2, ymm3" | ||||
|         check_x86asm cpunop          "CPU amdnop" | ||||
|     fi | ||||
| 
 | ||||
|     case "$cpu" in | ||||
|  | ||||
| @ -74,7 +74,7 @@ SECTION .text | ||||
| ; "movaps m0, [r5 + r4]" if PIC is enabled | ||||
| ; "movaps m0, [constant_name + r4]" if texrel are used | ||||
| %macro SET_PIC_BASE 3; reg, const_label | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     %{1}     %2, [%3]      ; lea r5, [rip+const] | ||||
|     %define  pic_base_%3 %2 | ||||
| %else | ||||
| @ -195,7 +195,7 @@ align 16 | ||||
| ; PIC relative addressing. Use this | ||||
| ; to count it in cglobal | ||||
| ; | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|   %define num_pic_regs 1 | ||||
| %else | ||||
|   %define num_pic_regs 0 | ||||
|  | ||||
| @ -91,7 +91,7 @@ SECTION .text | ||||
| 
 | ||||
| %macro chroma_mc8_mmx_func 2-3 | ||||
| %ifidn %2, rv40 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define rnd_1d_rv40 r8 | ||||
| %define rnd_2d_rv40 r8 | ||||
| %define extra_regs 2 | ||||
| @ -147,7 +147,7 @@ cglobal %1_%2_chroma_mc8%3, 6, 7 + extra_regs, 0 | ||||
|     or           r4d, r5d       ; x + y | ||||
| 
 | ||||
| %ifidn %2, rv40 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea           r8, [rnd_rv40_1d_tbl] | ||||
| %endif | ||||
| %if ARCH_X86_64 == 0 | ||||
| @ -198,7 +198,7 @@ cglobal %1_%2_chroma_mc8%3, 6, 7 + extra_regs, 0 | ||||
|     movd          m4, r4d         ; x | ||||
|     movd          m6, r5d         ; y | ||||
| %ifidn %2, rv40 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea           r8, [rnd_rv40_2d_tbl] | ||||
| %endif | ||||
| %if ARCH_X86_64 == 0 | ||||
| @ -283,7 +283,7 @@ cglobal %1_%2_chroma_mc8%3, 6, 7 + extra_regs, 0 | ||||
| %macro chroma_mc4_mmx_func 2 | ||||
| %define extra_regs 0 | ||||
| %ifidn %2, rv40 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define extra_regs 1 | ||||
| %endif ; PIC | ||||
| %endif ; rv40 | ||||
| @ -301,7 +301,7 @@ cglobal %1_%2_chroma_mc4, 6, 6 + extra_regs, 0 | ||||
|     psubw         m5, m3 | ||||
| 
 | ||||
| %ifidn %2, rv40 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|    lea            r6, [rnd_rv40_2d_tbl] | ||||
| %define rnd_2d_rv40 r6 | ||||
| %else | ||||
|  | ||||
| @ -42,7 +42,7 @@ scan8_mem: db  4+ 1*8, 5+ 1*8, 4+ 2*8, 5+ 2*8 | ||||
|            db  6+11*8, 7+11*8, 6+12*8, 7+12*8 | ||||
|            db  4+13*8, 5+13*8, 4+14*8, 5+14*8 | ||||
|            db  6+13*8, 7+13*8, 6+14*8, 7+14*8 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define npicregs 1 | ||||
| %define scan8 picregq | ||||
| %else | ||||
| @ -322,7 +322,7 @@ INIT_XMM sse2 | ||||
| cglobal h264_idct8_add4_8, 5, 8 + npicregs, 10, dst1, block_offset, block, stride, nnzc, cntr, coeff, dst2, picreg | ||||
|     movsxdifnidn r3, r3d | ||||
|     xor          r5, r5 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea     picregq, [scan8_mem] | ||||
| %endif | ||||
| .nextblock: | ||||
| @ -398,7 +398,7 @@ h264_idct_add8_mmx_plane: | ||||
| cglobal h264_idct_add8_422_8, 5, 8 + npicregs, 0, dst1, block_offset, block, stride, nnzc, cntr, coeff, dst2, picreg | ||||
| ; dst1, block_offset, block, stride, nnzc, cntr, coeff, dst2, picreg | ||||
|     movsxdifnidn r3, r3d | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea     picregq, [scan8_mem] | ||||
| %endif | ||||
| %if ARCH_X86_64 | ||||
|  | ||||
| @ -1311,10 +1311,7 @@ PRED8x8L_DOWN_RIGHT | ||||
| ;----------------------------------------------------------------------------- | ||||
| 
 | ||||
| %macro PRED8x8L_VERTICAL_RIGHT 0 | ||||
| cglobal pred8x8l_vertical_right_8, 4,5,7 | ||||
|     ; manually spill XMM registers for Win64 because | ||||
|     ; the code here is initialized with INIT_MMX | ||||
|     WIN64_SPILL_XMM 7 | ||||
| cglobal pred8x8l_vertical_right_8, 4,5,6 | ||||
|     sub          r0, r3 | ||||
|     lea          r4, [r0+r3*2] | ||||
|     movq        mm0, [r0+r3*1-8] | ||||
| @ -1384,7 +1381,6 @@ cglobal pred8x8l_vertical_right_8, 4,5,7 | ||||
|     movq2dq     xmm4, mm6 | ||||
|     pslldq      xmm4, 8 | ||||
|     por         xmm0, xmm4 | ||||
|     movdqa      xmm6, [pw_ff00] | ||||
|     movdqa      xmm1, xmm0 | ||||
|     lea           r2, [r1+r3*2] | ||||
|     movdqa      xmm2, xmm0 | ||||
| @ -1394,15 +1390,16 @@ cglobal pred8x8l_vertical_right_8, 4,5,7 | ||||
|     pavgb       xmm2, xmm0 | ||||
| INIT_XMM cpuname | ||||
|     PRED4x4_LOWPASS xmm4, xmm3, xmm1, xmm0, xmm5 | ||||
|     pandn       xmm6, xmm4 | ||||
|     movdqa      xmm0, [pw_ff00] | ||||
|     pandn       xmm0, xmm4 | ||||
|     movdqa      xmm5, xmm4 | ||||
|     psrlw       xmm4, 8 | ||||
|     packuswb    xmm6, xmm4 | ||||
|     movhlps     xmm4, xmm6 | ||||
|     packuswb    xmm0, xmm4 | ||||
|     movhlps     xmm4, xmm0 | ||||
|     movhps [r0+r3*2], xmm5 | ||||
|     movhps [r0+r3*1], xmm2 | ||||
|     psrldq      xmm5, 4 | ||||
|     movss       xmm5, xmm6 | ||||
|     movss       xmm5, xmm0 | ||||
|     psrldq      xmm2, 4 | ||||
|     movss       xmm2, xmm4 | ||||
|     lea           r0, [r2+r3*2] | ||||
|  | ||||
| @ -180,7 +180,7 @@ SECTION .text | ||||
| %macro EPEL_FILTER 5 ; bit depth, filter index, xmma, xmmb, gprtmp | ||||
| %if cpuflag(avx2) | ||||
| %assign %%offset 32 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea              %5q, [hevc_epel_filters_avx2_%1] | ||||
|     %define FILTER %5q | ||||
| %else | ||||
| @ -188,7 +188,7 @@ SECTION .text | ||||
| %endif | ||||
| %else | ||||
| %assign %%offset 16 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea              %5q, [hevc_epel_filters_sse4_%1] | ||||
|     %define FILTER %5q | ||||
| %else | ||||
| @ -216,7 +216,7 @@ SECTION .text | ||||
| %define %%table  hevc_epel_filters_sse4_%1 | ||||
| %endif | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea           r3srcq, [%%table] | ||||
|     %define FILTER r3srcq | ||||
| %else | ||||
| @ -234,7 +234,7 @@ SECTION .text | ||||
| %else | ||||
| %define %%table  hevc_epel_filters_sse4_10 | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea           r3srcq, [%%table] | ||||
|     %define FILTER r3srcq | ||||
| %else | ||||
| @ -257,7 +257,7 @@ SECTION .text | ||||
| %define %%table  hevc_qpel_filters_sse4_%1 | ||||
| %endif | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea         rfilterq, [%%table] | ||||
| %else | ||||
|     %define rfilterq %%table | ||||
| @ -576,7 +576,7 @@ SECTION .text | ||||
| %define %%table  hevc_qpel_filters_sse4_%2 | ||||
| %endif | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea         rfilterq, [%%table] | ||||
| %else | ||||
|     %define rfilterq %%table | ||||
| @ -1288,7 +1288,7 @@ HEVC_PUT_HEVC_QPEL_HV 16, 10 | ||||
| %assign %%offset 4 | ||||
|     dec %2q | ||||
|     shl %2q, 3 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea %5q, [%%table] | ||||
|     %define FILTER %5q | ||||
| %else | ||||
| @ -1365,7 +1365,7 @@ cglobal hevc_put_hevc_qpel_hv%1_%2, 6, 7, 27, dst, src, srcstride, height, mx, m | ||||
|     sub             myq, 1 | ||||
|     shl             myq, 5 | ||||
| %define %%table hevc_qpel_filters_avx512icl_v_%1 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea tmpq, [%%table] | ||||
|     %define FILTER tmpq | ||||
| %else | ||||
|  | ||||
| @ -51,7 +51,7 @@ sixtap_filter_v_m:   times 8 dw   1 | ||||
|                      times 8 dw  20 | ||||
|                      times 8 dw  52 | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define sixtap_filter_hw   picregq | ||||
| %define sixtap_filter_hb   picregq | ||||
| %define sixtap_filter_v    picregq | ||||
| @ -84,7 +84,7 @@ SECTION .text | ||||
| %if WIN64 | ||||
|    movsxd   %1q, %1d | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|    add      %1q, picregq | ||||
| %else | ||||
|    add      %1q, %2 | ||||
| @ -104,7 +104,7 @@ SECTION .text | ||||
| 
 | ||||
| %macro FILTER_V 1 | ||||
| cglobal %1_rv40_qpel_v, 6,6+npicregs,12, dst, dststride, src, srcstride, height, my, picreg | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_v_m] | ||||
| %endif | ||||
|     pxor      m7, m7 | ||||
| @ -175,7 +175,7 @@ cglobal %1_rv40_qpel_v, 6,6+npicregs,12, dst, dststride, src, srcstride, height, | ||||
| 
 | ||||
| %macro FILTER_H  1 | ||||
| cglobal %1_rv40_qpel_h, 6, 6+npicregs, 12, dst, dststride, src, srcstride, height, mx, picreg | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_v_m] | ||||
| %endif | ||||
|     pxor      m7, m7 | ||||
| @ -238,7 +238,7 @@ FILTER_V  avg | ||||
| 
 | ||||
| %macro FILTER_SSSE3 1 | ||||
| cglobal %1_rv40_qpel_v, 6,6+npicregs,8, dst, dststride, src, srcstride, height, my, picreg | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_hb_m] | ||||
| %endif | ||||
| 
 | ||||
| @ -283,7 +283,7 @@ cglobal %1_rv40_qpel_v, 6,6+npicregs,8, dst, dststride, src, srcstride, height, | ||||
|     RET | ||||
| 
 | ||||
| cglobal %1_rv40_qpel_h, 6,6+npicregs,8, dst, dststride, src, srcstride, height, mx, picreg | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_hb_m] | ||||
| %endif | ||||
|     mova      m3, [filter_h6_shuf2] | ||||
|  | ||||
| @ -308,7 +308,7 @@ cglobal sbr_qmf_pre_shuffle, 1,4,6,z | ||||
|     movq    [r2q], m2 | ||||
|     RET | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define NREGS 1 | ||||
| %if UNIX64 | ||||
| %define NOISE_TABLE r6q ; r5q is m_max | ||||
| @ -321,7 +321,7 @@ cglobal sbr_qmf_pre_shuffle, 1,4,6,z | ||||
| %endif | ||||
| 
 | ||||
| %macro LOAD_NST  1 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  NOISE_TABLE, [%1] | ||||
|     mova          m0, [kxq + NOISE_TABLE] | ||||
| %else | ||||
| @ -371,7 +371,7 @@ apply_noise_main: | ||||
|     movsxdifnidn    noiseq, noised | ||||
|     dec    noiseq | ||||
|     shl    countd, 2 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea NOISE_TABLE, [sbr_noise_table] | ||||
| %endif | ||||
|     lea        Yq, [Yq + 2*countq] | ||||
|  | ||||
| @ -114,7 +114,7 @@ bilinear_filter_vb_m: times 8 db 7, 1 | ||||
|                       times 8 db 2, 6 | ||||
|                       times 8 db 1, 7 | ||||
| 
 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
| %define fourtap_filter_hw  picregq | ||||
| %define sixtap_filter_hw   picregq | ||||
| %define fourtap_filter_hb  picregq | ||||
| @ -166,7 +166,7 @@ cglobal put_vp8_epel%1_h6, 6, 6 + npicregs, 8, dst, dststride, src, srcstride, h | ||||
|     lea      mxd, [mxq*3] | ||||
|     mova      m3, [filter_h6_shuf2] | ||||
|     mova      m4, [filter_h6_shuf3] | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_hb_m] | ||||
| %endif | ||||
|     mova      m5, [sixtap_filter_hb+mxq*8-48] ; set up 6tap filter in bytes | ||||
| @ -207,7 +207,7 @@ cglobal put_vp8_epel%1_h4, 6, 6 + npicregs, 7, dst, dststride, src, srcstride, h | ||||
|     mova      m2, [pw_256] | ||||
|     mova      m3, [filter_h2_shuf] | ||||
|     mova      m4, [filter_h4_shuf] | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [fourtap_filter_hb_m] | ||||
| %endif | ||||
|     mova      m5, [fourtap_filter_hb+mxq-16] ; set up 4tap filter in bytes | ||||
| @ -234,7 +234,7 @@ cglobal put_vp8_epel%1_h4, 6, 6 + npicregs, 7, dst, dststride, src, srcstride, h | ||||
| 
 | ||||
| cglobal put_vp8_epel%1_v4, 7, 7, 8, dst, dststride, src, srcstride, height, picreg, my | ||||
|     shl      myd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [fourtap_filter_hb_m] | ||||
| %endif | ||||
|     mova      m5, [fourtap_filter_hb+myq-16] | ||||
| @ -272,7 +272,7 @@ cglobal put_vp8_epel%1_v4, 7, 7, 8, dst, dststride, src, srcstride, height, picr | ||||
| 
 | ||||
| cglobal put_vp8_epel%1_v6, 7, 7, 8, dst, dststride, src, srcstride, height, picreg, my | ||||
|     lea      myd, [myq*3] | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_hb_m] | ||||
| %endif | ||||
|     lea      myq, [sixtap_filter_hb+myq*8] | ||||
| @ -326,7 +326,7 @@ FILTER_SSSE3 8 | ||||
| INIT_MMX mmxext | ||||
| cglobal put_vp8_epel4_h4, 6, 6 + npicregs, 0, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     shl       mxd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea   picregq, [fourtap_filter_hw_m] | ||||
| %endif | ||||
|     movq      mm4, [fourtap_filter_hw+mxq-16] ; set up 4tap filter in words | ||||
| @ -374,7 +374,7 @@ cglobal put_vp8_epel4_h4, 6, 6 + npicregs, 0, dst, dststride, src, srcstride, he | ||||
| INIT_MMX mmxext | ||||
| cglobal put_vp8_epel4_h6, 6, 6 + npicregs, 0, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     lea       mxd, [mxq*3] | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea   picregq, [sixtap_filter_hw_m] | ||||
| %endif | ||||
|     movq      mm4, [sixtap_filter_hw+mxq*8-48] ; set up 4tap filter in words | ||||
| @ -431,7 +431,7 @@ cglobal put_vp8_epel4_h6, 6, 6 + npicregs, 0, dst, dststride, src, srcstride, he | ||||
| INIT_XMM sse2 | ||||
| cglobal put_vp8_epel8_h4, 6, 6 + npicregs, 10, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     shl      mxd, 5 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [fourtap_filter_v_m] | ||||
| %endif | ||||
|     lea      mxq, [fourtap_filter_v+mxq-32] | ||||
| @ -480,7 +480,7 @@ INIT_XMM sse2 | ||||
| cglobal put_vp8_epel8_h6, 6, 6 + npicregs, 14, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     lea      mxd, [mxq*3] | ||||
|     shl      mxd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_v_m] | ||||
| %endif | ||||
|     lea      mxq, [sixtap_filter_v+mxq-96] | ||||
| @ -543,7 +543,7 @@ cglobal put_vp8_epel8_h6, 6, 6 + npicregs, 14, dst, dststride, src, srcstride, h | ||||
| ; 4x4 block, V-only 4-tap filter | ||||
| cglobal put_vp8_epel%1_v4, 7, 7, 8, dst, dststride, src, srcstride, height, picreg, my | ||||
|     shl      myd, 5 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [fourtap_filter_v_m] | ||||
| %endif | ||||
|     lea      myq, [fourtap_filter_v+myq-32] | ||||
| @ -597,7 +597,7 @@ cglobal put_vp8_epel%1_v4, 7, 7, 8, dst, dststride, src, srcstride, height, picr | ||||
| cglobal put_vp8_epel%1_v6, 7, 7, 8, dst, dststride, src, srcstride, height, picreg, my | ||||
|     shl      myd, 4 | ||||
|     lea      myq, [myq*3] | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [sixtap_filter_v_m] | ||||
| %endif | ||||
|     lea      myq, [sixtap_filter_v+myq-96] | ||||
| @ -667,7 +667,7 @@ FILTER_V 8 | ||||
| %if cpuflag(ssse3) | ||||
| cglobal put_vp8_bilinear%1_v, 7, 7, 5, dst, dststride, src, srcstride, height, picreg, my | ||||
|     shl      myd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [bilinear_filter_vb_m] | ||||
| %endif | ||||
|     pxor      m4, m4 | ||||
| @ -697,7 +697,7 @@ cglobal put_vp8_bilinear%1_v, 7, 7, 5, dst, dststride, src, srcstride, height, p | ||||
| %else ; cpuflag(ssse3) | ||||
| cglobal put_vp8_bilinear%1_v, 7, 7, 7, dst, dststride, src, srcstride, height, picreg, my | ||||
|     shl      myd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [bilinear_filter_vw_m] | ||||
| %endif | ||||
|     pxor      m6, m6 | ||||
| @ -743,7 +743,7 @@ cglobal put_vp8_bilinear%1_v, 7, 7, 7, dst, dststride, src, srcstride, height, p | ||||
| %if cpuflag(ssse3) | ||||
| cglobal put_vp8_bilinear%1_h, 6, 6 + npicregs, 5, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     shl      mxd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [bilinear_filter_vb_m] | ||||
| %endif | ||||
|     pxor      m4, m4 | ||||
| @ -773,7 +773,7 @@ cglobal put_vp8_bilinear%1_h, 6, 6 + npicregs, 5, dst, dststride, src, srcstride | ||||
| %else ; cpuflag(ssse3) | ||||
| cglobal put_vp8_bilinear%1_h, 6, 6 + npicregs, 7, dst, dststride, src, srcstride, height, mx, picreg | ||||
|     shl      mxd, 4 | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea  picregq, [bilinear_filter_vw_m] | ||||
| %endif | ||||
|     pxor      m6, m6 | ||||
|  | ||||
| @ -330,7 +330,9 @@ IDCT_4x4_FN ssse3 | ||||
| INIT_MMX %5 | ||||
| cglobal vp9_%1_%3_4x4_add, 3, 3, 0, dst, stride, block, eob | ||||
| %if WIN64 && notcpuflag(ssse3) | ||||
| INIT_XMM cpuname | ||||
|     WIN64_SPILL_XMM 8 | ||||
| INIT_MMX cpuname | ||||
| %endif | ||||
|     movdqa            xmm5, [pd_8192] | ||||
|     mova                m0, [blockq+ 0] | ||||
|  | ||||
| @ -303,7 +303,9 @@ IDCT4_10_FN | ||||
| %macro IADST4_FN 4 | ||||
| cglobal vp9_%1_%3_4x4_add_10, 3, 3, 0, dst, stride, block, eob | ||||
| %if WIN64 && notcpuflag(ssse3) | ||||
| INIT_XMM cpuname | ||||
|     WIN64_SPILL_XMM 8 | ||||
| INIT_MMX cpuname | ||||
| %endif | ||||
|     movdqa            xmm5, [pd_8192] | ||||
|     mova                m0, [blockq+0*16+0] | ||||
| @ -672,7 +674,7 @@ cglobal vp9_idct_idct_8x8_add_10, 4, 6 + ARCH_X86_64, 14, \ | ||||
|     mov            dstbakq, dstq | ||||
|     movsxd            cntq, cntd | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea               ptrq, [default_8x8] | ||||
|     movzx             cntd, byte [ptrq+cntq-1] | ||||
| %else | ||||
| @ -921,7 +923,7 @@ cglobal vp9_%1_%3_8x8_add_10, 4, 6 + ARCH_X86_64, 16, \ | ||||
|     mov            dstbakq, dstq | ||||
|     movsxd            cntq, cntd | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea               ptrq, [%5_8x8] | ||||
|     movzx             cntd, byte [ptrq+cntq-1] | ||||
| %else | ||||
| @ -1128,7 +1130,7 @@ cglobal vp9_idct_idct_16x16_add_10, 4, 6 + ARCH_X86_64, 16, \ | ||||
|     mov            dstbakq, dstq | ||||
|     movsxd            cntq, cntd | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea               ptrq, [default_16x16] | ||||
|     movzx             cntd, byte [ptrq+cntq-1] | ||||
| %else | ||||
| @ -1445,7 +1447,7 @@ cglobal vp9_%1_%4_16x16_add_10, 4, 6 + ARCH_X86_64, 16, \ | ||||
|     mov            dstbakq, dstq | ||||
|     movsxd            cntq, cntd | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea               ptrq, [%7_16x16] | ||||
|     movzx             cntd, byte [ptrq+cntq-1] | ||||
| %else | ||||
| @ -1958,7 +1960,7 @@ cglobal vp9_idct_idct_32x32_add_10, 4, 6 + ARCH_X86_64, 16, \ | ||||
|     mov            dstbakq, dstq | ||||
|     movsxd            cntq, cntd | ||||
| %endif | ||||
| %ifdef PIC | ||||
| %if PIC | ||||
|     lea               ptrq, [default_32x32] | ||||
|     movzx             cntd, byte [ptrq+cntq-1] | ||||
| %else | ||||
|  | ||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user