x86/vf_stereo3d: make ff_anaglyph_sse4 work on x86_32
Reviewed-by: Paul B Mahol <onemda@gmail.com> Signed-off-by: James Almer <jamrial@gmail.com>
This commit is contained in:
		
							parent
							
								
									6e243d17e9
								
							
						
					
					
						commit
						1817643d4f
					
				@ -22,8 +22,6 @@
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
%include "libavutil/x86/x86util.asm"
 | 
					%include "libavutil/x86/x86util.asm"
 | 
				
			||||||
 | 
					
 | 
				
			||||||
%if ARCH_X86_64
 | 
					 | 
				
			||||||
 | 
					 | 
				
			||||||
SECTION_RODATA
 | 
					SECTION_RODATA
 | 
				
			||||||
 | 
					
 | 
				
			||||||
; rgbrgbrgbrgb
 | 
					; rgbrgbrgbrgb
 | 
				
			||||||
@ -37,10 +35,33 @@ ex_b: db 2,-1,-1,-1,5,-1,-1,-1,8,-1,-1,-1,11,-1,-1,-1
 | 
				
			|||||||
SECTION .text
 | 
					SECTION .text
 | 
				
			||||||
 | 
					
 | 
				
			||||||
INIT_XMM sse4
 | 
					INIT_XMM sse4
 | 
				
			||||||
 | 
					%if ARCH_X86_64
 | 
				
			||||||
cglobal anaglyph, 6, 10, 14, 2*6*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesize, r_linesize, width, height, o, cnt
 | 
					cglobal anaglyph, 6, 10, 14, 2*6*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesize, r_linesize, width, height, o, cnt
 | 
				
			||||||
%define ana_matrix_rq r6q
 | 
					%define ana_matrix_rq r6q
 | 
				
			||||||
%define ana_matrix_gq r7q
 | 
					%define ana_matrix_gq r7q
 | 
				
			||||||
%define ana_matrix_bq r8q
 | 
					%define ana_matrix_bq r8q
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					%else ; ARCH_X86_32
 | 
				
			||||||
 | 
					%if HAVE_ALIGNED_STACK
 | 
				
			||||||
 | 
					cglobal anaglyph, 3, 7, 8, 2*9*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesize, o, cnt
 | 
				
			||||||
 | 
					%else
 | 
				
			||||||
 | 
					cglobal anaglyph, 3, 6, 8, 2*9*mmsize, dst, lsrc, rsrc, dst_linesize, o, cnt
 | 
				
			||||||
 | 
					%define l_linesizeq r4mp
 | 
				
			||||||
 | 
					%endif ; HAVE_ALIGNED_STACK
 | 
				
			||||||
 | 
					%define ana_matrix_rq r3q
 | 
				
			||||||
 | 
					%define ana_matrix_gq r4q
 | 
				
			||||||
 | 
					%define ana_matrix_bq r5q
 | 
				
			||||||
 | 
					%define r_linesizeq r5mp
 | 
				
			||||||
 | 
					%define widthd  r6mp
 | 
				
			||||||
 | 
					%define heightd r7mp
 | 
				
			||||||
 | 
					%define  m8 [rsp+mmsize*12]
 | 
				
			||||||
 | 
					%define  m9 [rsp+mmsize*13]
 | 
				
			||||||
 | 
					%define m10 [rsp+mmsize*14]
 | 
				
			||||||
 | 
					%define m11 [rsp+mmsize*15]
 | 
				
			||||||
 | 
					%define m12 [rsp+mmsize*16]
 | 
				
			||||||
 | 
					%define m13 [rsp+mmsize*17]
 | 
				
			||||||
 | 
					%endif ; ARCH
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    mov        ana_matrix_rq, r8m
 | 
					    mov        ana_matrix_rq, r8m
 | 
				
			||||||
    mov        ana_matrix_gq, r9m
 | 
					    mov        ana_matrix_gq, r9m
 | 
				
			||||||
    mov        ana_matrix_bq, r10m
 | 
					    mov        ana_matrix_bq, r10m
 | 
				
			||||||
@ -74,6 +95,7 @@ cglobal anaglyph, 6, 10, 14, 2*6*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesi
 | 
				
			|||||||
    mova     [rsp+mmsize*10], m4
 | 
					    mova     [rsp+mmsize*10], m4
 | 
				
			||||||
    mova     [rsp+mmsize*11], m5
 | 
					    mova     [rsp+mmsize*11], m5
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					%if ARCH_X86_64
 | 
				
			||||||
    movu                 m11, [ana_matrix_bq+ 0]
 | 
					    movu                 m11, [ana_matrix_bq+ 0]
 | 
				
			||||||
    movq                 m13, [ana_matrix_bq+16]
 | 
					    movq                 m13, [ana_matrix_bq+16]
 | 
				
			||||||
    pshufd                m8, m11, q0000
 | 
					    pshufd                m8, m11, q0000
 | 
				
			||||||
@ -84,6 +106,26 @@ cglobal anaglyph, 6, 10, 14, 2*6*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesi
 | 
				
			|||||||
    pshufd               m13, m13, q1111
 | 
					    pshufd               m13, m13, q1111
 | 
				
			||||||
    mov               widthd, dword widthm
 | 
					    mov               widthd, dword widthm
 | 
				
			||||||
    mov              heightd, dword heightm
 | 
					    mov              heightd, dword heightm
 | 
				
			||||||
 | 
					%else
 | 
				
			||||||
 | 
					    movu                  m3, [ana_matrix_bq+ 0]
 | 
				
			||||||
 | 
					    movq                  m5, [ana_matrix_bq+16]
 | 
				
			||||||
 | 
					    pshufd                m0, m3, q0000
 | 
				
			||||||
 | 
					    pshufd                m1, m3, q1111
 | 
				
			||||||
 | 
					    pshufd                m2, m3, q2222
 | 
				
			||||||
 | 
					    pshufd                m3, m3, q3333
 | 
				
			||||||
 | 
					    pshufd                m4, m5, q0000
 | 
				
			||||||
 | 
					    pshufd                m5, m5, q1111
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*12], m0
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*13], m1
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*14], m2
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*15], m3
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*16], m4
 | 
				
			||||||
 | 
					    mova     [rsp+mmsize*17], m5
 | 
				
			||||||
 | 
					    mov        dst_linesizeq, r3m
 | 
				
			||||||
 | 
					%if HAVE_ALIGNED_STACK
 | 
				
			||||||
 | 
					    mov          l_linesizeq, r4m
 | 
				
			||||||
 | 
					%endif
 | 
				
			||||||
 | 
					%endif ; ARCH
 | 
				
			||||||
 | 
					
 | 
				
			||||||
.nextrow:
 | 
					.nextrow:
 | 
				
			||||||
    mov                   od, widthd
 | 
					    mov                   od, widthd
 | 
				
			||||||
@ -172,4 +214,3 @@ cglobal anaglyph, 6, 10, 14, 2*6*mmsize, dst, lsrc, rsrc, dst_linesize, l_linesi
 | 
				
			|||||||
    sub       heightd, 1
 | 
					    sub       heightd, 1
 | 
				
			||||||
    jg .nextrow
 | 
					    jg .nextrow
 | 
				
			||||||
REP_RET
 | 
					REP_RET
 | 
				
			||||||
%endif
 | 
					 | 
				
			||||||
 | 
				
			|||||||
@ -31,7 +31,7 @@ void ff_stereo3d_init_x86(Stereo3DDSPContext *dsp)
 | 
				
			|||||||
{
 | 
					{
 | 
				
			||||||
    int cpu_flags = av_get_cpu_flags();
 | 
					    int cpu_flags = av_get_cpu_flags();
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    if (ARCH_X86_64 && EXTERNAL_SSE4(cpu_flags)) {
 | 
					    if (EXTERNAL_SSE4(cpu_flags)) {
 | 
				
			||||||
        dsp->anaglyph = ff_anaglyph_sse4;
 | 
					        dsp->anaglyph = ff_anaglyph_sse4;
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
				
			|||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user