On Wed, Jun 21, 2017 at 09:46:58AM -0400, Ronald S. Bultje wrote:
> ---
>  libavfilter/x86/vf_spp.c | 15 ++++++++++++++-
>  1 file changed, 14 insertions(+), 1 deletion(-)
> 
> diff --git a/libavfilter/x86/vf_spp.c b/libavfilter/x86/vf_spp.c
> index 45a9eb0..8e3c820 100644
> --- a/libavfilter/x86/vf_spp.c
> +++ b/libavfilter/x86/vf_spp.c
> @@ -217,6 +217,17 @@ static void store_slice_mmx(uint8_t *dst, const int16_t *src,
>  
>  #endif /* HAVE_MMX_INLINE */
>  
> +static const uint8_t simple_mmx_permutation[64] = {
> +    0x00, 0x08, 0x04, 0x09, 0x01, 0x0C, 0x05, 0x0D,
> +    0x10, 0x18, 0x14, 0x19, 0x11, 0x1C, 0x15, 0x1D,
> +    0x20, 0x28, 0x24, 0x29, 0x21, 0x2C, 0x25, 0x2D,
> +    0x12, 0x1A, 0x16, 0x1B, 0x13, 0x1E, 0x17, 0x1F,
> +    0x02, 0x0A, 0x06, 0x0B, 0x03, 0x0E, 0x07, 0x0F,
> +    0x30, 0x38, 0x34, 0x39, 0x31, 0x3C, 0x35, 0x3D,
> +    0x22, 0x2A, 0x26, 0x2B, 0x23, 0x2E, 0x27, 0x2F,
> +    0x32, 0x3A, 0x36, 0x3B, 0x33, 0x3E, 0x37, 0x3F,
> +};
> +
>  av_cold void ff_spp_init_x86(SPPContext *s)
>  {
>  #if HAVE_MMX_INLINE
> @@ -226,7 +237,9 @@ av_cold void ff_spp_init_x86(SPPContext *s)
>          int64_t bps;
>          s->store_slice = store_slice_mmx;
>          av_opt_get_int(s->dct, "bits_per_sample", 0, &bps);
> -        if (bps <= 8) {
> +        if (bps <= 8 &&
> +            !memcmp(s->dct->idct_permutation, simple_mmx_permutation,
> +                    sizeof(simple_mmx_permutation))) {

This would disable the SIMD code.

Also, the memcmp() is a very ugly way to check the permutation.

[...]

-- 
Michael     GnuPG fingerprint: 9FF2128B147EF6730BADF133611EC787040B0FAB

It is dangerous to be right in matters on which the established authorities
are wrong. -- Voltaire

Attachment: signature.asc
Description: Digital signature

_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
http://ffmpeg.org/mailman/listinfo/ffmpeg-devel

Reply via email to