Path: blob/master/3rdparty/libpng/intel/intel_init.c
16337 views
1/* intel_init.c - SSE2 optimized filter functions2*3* Copyright (c) 2016-2017 Glenn Randers-Pehrson4* Written by Mike Klein and Matt Sarett, Google, Inc.5* Derived from arm/arm_init.c6*7* Last changed in libpng 1.6.29 [March 16, 2017]8*9* This code is released under the libpng license.10* For conditions of distribution and use, see the disclaimer11* and license in png.h12*/1314#include "../pngpriv.h"1516#ifdef PNG_READ_SUPPORTED17#if PNG_INTEL_SSE_IMPLEMENTATION > 01819void20png_init_filter_functions_sse2(png_structp pp, unsigned int bpp)21{22/* The techniques used to implement each of these filters in SSE operate on23* one pixel at a time.24* So they generally speed up 3bpp images about 3x, 4bpp images about 4x.25* They can scale up to 6 and 8 bpp images and down to 2 bpp images,26* but they'd not likely have any benefit for 1bpp images.27* Most of these can be implemented using only MMX and 64-bit registers,28* but they end up a bit slower than using the equally-ubiquitous SSE2.29*/30png_debug(1, "in png_init_filter_functions_sse2");31if (bpp == 3)32{33pp->read_filter[PNG_FILTER_VALUE_SUB-1] = png_read_filter_row_sub3_sse2;34pp->read_filter[PNG_FILTER_VALUE_AVG-1] = png_read_filter_row_avg3_sse2;35pp->read_filter[PNG_FILTER_VALUE_PAETH-1] =36png_read_filter_row_paeth3_sse2;37}38else if (bpp == 4)39{40pp->read_filter[PNG_FILTER_VALUE_SUB-1] = png_read_filter_row_sub4_sse2;41pp->read_filter[PNG_FILTER_VALUE_AVG-1] = png_read_filter_row_avg4_sse2;42pp->read_filter[PNG_FILTER_VALUE_PAETH-1] =43png_read_filter_row_paeth4_sse2;44}4546/* No need optimize PNG_FILTER_VALUE_UP. The compiler should47* autovectorize.48*/49}5051#endif /* PNG_INTEL_SSE_IMPLEMENTATION > 0 */52#endif /* PNG_READ_SUPPORTED */535455