1 // Copyright 2015 Google Inc. All Rights Reserved.
2 //
3 // Use of this source code is governed by a BSD-style license
4 // that can be found in the COPYING file in the root of the source
5 // tree. An additional intellectual property rights grant can be found
6 // in the file PATENTS. All contributing project authors may
7 // be found in the AUTHORS file in the root of the source tree.
8 // -----------------------------------------------------------------------------
9 //
10 // SSE4 version of some decoding functions.
11 //
12 // Author: Skal (pascal.massimino@gmail.com)
13 
14 #include "src/dsp/dsp.h"
15 
16 #if defined(WEBP_USE_SSE41)
17 
18 #include <smmintrin.h>
19 #include "src/dec/vp8i_dec.h"
20 #include "src/utils/utils.h"
21 
HE16_SSE41(uint8_t * dst)22 static void HE16_SSE41(uint8_t* dst) {     // horizontal
23   int j;
24   const __m128i kShuffle3 = _mm_set1_epi8(3);
25   for (j = 16; j > 0; --j) {
26     const __m128i in = _mm_cvtsi32_si128(WebPMemToUint32(dst - 4));
27     const __m128i values = _mm_shuffle_epi8(in, kShuffle3);
28     _mm_storeu_si128((__m128i*)dst, values);
29     dst += BPS;
30   }
31 }
32 
33 //------------------------------------------------------------------------------
34 // Entry point
35 
36 extern void VP8DspInitSSE41(void);
37 
VP8DspInitSSE41(void)38 WEBP_TSAN_IGNORE_FUNCTION void VP8DspInitSSE41(void) {
39   VP8PredLuma16[3] = HE16_SSE41;
40 }
41 
42 #else  // !WEBP_USE_SSE41
43 
// Reached only when WEBP_USE_SSE41 is not defined. Presumably this macro
// expands to a do-nothing definition of VP8DspInitSSE41 so the symbol still
// exists -- confirm against the WEBP_DSP_INIT_STUB definition.
44 WEBP_DSP_INIT_STUB(VP8DspInitSSE41)
45 
46 #endif  // WEBP_USE_SSE41
47