This reverts commits (tags/n4.0) 1a5865b6dc and 8fb1d63d91. They made fate interlace tests fail when AVX2 was used. Signed-off-by: James Almer <jamrial@gmail.com>
| @@ -201,10 +201,5 @@ LOWPASS_LINE | |||||
| INIT_XMM avx | INIT_XMM avx | ||||
| LOWPASS_LINE | LOWPASS_LINE | ||||
| %if HAVE_AVX2_EXTERNAL | |||||
| INIT_YMM avx2 | |||||
| LOWPASS_LINE | |||||
| %endif | |||||
| INIT_XMM sse2 | INIT_XMM sse2 | ||||
| LOWPASS_LINE_COMPLEX | LOWPASS_LINE_COMPLEX | ||||
| @@ -32,9 +32,6 @@ void ff_lowpass_line_sse2(uint8_t *dstp, ptrdiff_t linesize, | |||||
| void ff_lowpass_line_avx (uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_avx (uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| ptrdiff_t pref, int clip_max); | ptrdiff_t pref, int clip_max); | ||||
| void ff_lowpass_line_avx2 (uint8_t *dstp, ptrdiff_t linesize, | |||||
| const uint8_t *srcp, ptrdiff_t mref, | |||||
| ptrdiff_t pref, int clip_max); | |||||
| void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| @@ -42,9 +39,6 @@ void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | |||||
| void ff_lowpass_line_16_avx (uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_16_avx (uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| ptrdiff_t pref, int clip_max); | ptrdiff_t pref, int clip_max); | ||||
| void ff_lowpass_line_16_avx2 (uint8_t *dstp, ptrdiff_t linesize, | |||||
| const uint8_t *srcp, ptrdiff_t mref, | |||||
| ptrdiff_t pref, int clip_max); | |||||
| void ff_lowpass_line_complex_sse2(uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_complex_sse2(uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| @@ -68,9 +62,6 @@ av_cold void ff_interlace_init_x86(InterlaceContext *s, int depth) | |||||
| if (EXTERNAL_AVX(cpu_flags)) | if (EXTERNAL_AVX(cpu_flags)) | ||||
| if (s->lowpass == VLPF_LIN) | if (s->lowpass == VLPF_LIN) | ||||
| s->lowpass_line = ff_lowpass_line_16_avx; | s->lowpass_line = ff_lowpass_line_16_avx; | ||||
| if (EXTERNAL_AVX2_FAST(cpu_flags)) | |||||
| if (s->lowpass == VLPF_LIN) | |||||
| s->lowpass_line = ff_lowpass_line_16_avx2; | |||||
| } else { | } else { | ||||
| if (EXTERNAL_SSE2(cpu_flags)) { | if (EXTERNAL_SSE2(cpu_flags)) { | ||||
| if (s->lowpass == VLPF_LIN) | if (s->lowpass == VLPF_LIN) | ||||
| @@ -81,8 +72,5 @@ av_cold void ff_interlace_init_x86(InterlaceContext *s, int depth) | |||||
| if (EXTERNAL_AVX(cpu_flags)) | if (EXTERNAL_AVX(cpu_flags)) | ||||
| if (s->lowpass == VLPF_LIN) | if (s->lowpass == VLPF_LIN) | ||||
| s->lowpass_line = ff_lowpass_line_avx; | s->lowpass_line = ff_lowpass_line_avx; | ||||
| if (EXTERNAL_AVX2_FAST(cpu_flags)) | |||||
| if (s->lowpass == VLPF_LIN) | |||||
| s->lowpass_line = ff_lowpass_line_avx2; | |||||
| } | } | ||||
| } | } | ||||
| @@ -33,9 +33,6 @@ void ff_lowpass_line_sse2(uint8_t *dstp, ptrdiff_t linesize, | |||||
| void ff_lowpass_line_avx (uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_avx (uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| ptrdiff_t pref, int clip_max); | ptrdiff_t pref, int clip_max); | ||||
| void ff_lowpass_line_avx2 (uint8_t *dstp, ptrdiff_t linesize, | |||||
| const uint8_t *srcp, ptrdiff_t mref, | |||||
| ptrdiff_t pref, int clip_max); | |||||
| void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| @@ -43,9 +40,6 @@ void ff_lowpass_line_16_sse2(uint8_t *dstp, ptrdiff_t linesize, | |||||
| void ff_lowpass_line_16_avx (uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_16_avx (uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| ptrdiff_t pref, int clip_max); | ptrdiff_t pref, int clip_max); | ||||
| void ff_lowpass_line_16_avx2 (uint8_t *dstp, ptrdiff_t linesize, | |||||
| const uint8_t *srcp, ptrdiff_t mref, | |||||
| ptrdiff_t pref, int clip_max); | |||||
| void ff_lowpass_line_complex_sse2(uint8_t *dstp, ptrdiff_t linesize, | void ff_lowpass_line_complex_sse2(uint8_t *dstp, ptrdiff_t linesize, | ||||
| const uint8_t *srcp, ptrdiff_t mref, | const uint8_t *srcp, ptrdiff_t mref, | ||||
| @@ -69,11 +63,6 @@ av_cold void ff_tinterlace_init_x86(TInterlaceContext *s) | |||||
| if (EXTERNAL_AVX(cpu_flags)) | if (EXTERNAL_AVX(cpu_flags)) | ||||
| if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | ||||
| s->lowpass_line = ff_lowpass_line_16_avx; | s->lowpass_line = ff_lowpass_line_16_avx; | ||||
| if (EXTERNAL_AVX2_FAST(cpu_flags)) { | |||||
| if (!(s->flags & TINTERLACE_FLAG_CVLPF)) { | |||||
| s->lowpass_line = ff_lowpass_line_16_avx2; | |||||
| } | |||||
| } | |||||
| } else { | } else { | ||||
| if (EXTERNAL_SSE2(cpu_flags)) { | if (EXTERNAL_SSE2(cpu_flags)) { | ||||
| if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | ||||
| @@ -84,10 +73,5 @@ av_cold void ff_tinterlace_init_x86(TInterlaceContext *s) | |||||
| if (EXTERNAL_AVX(cpu_flags)) | if (EXTERNAL_AVX(cpu_flags)) | ||||
| if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | if (!(s->flags & TINTERLACE_FLAG_CVLPF)) | ||||
| s->lowpass_line = ff_lowpass_line_avx; | s->lowpass_line = ff_lowpass_line_avx; | ||||
| if (EXTERNAL_AVX2_FAST(cpu_flags)) { | |||||
| if (!(s->flags & TINTERLACE_FLAG_CVLPF)) { | |||||
| s->lowpass_line = ff_lowpass_line_avx2; | |||||
| } | |||||
| } | |||||
| } | } | ||||
| } | } | ||||