Blame src/dsp/dec_sse41.c

Packit 9c6abc
// Copyright 2015 Google Inc. All Rights Reserved.
Packit 9c6abc
//
Packit 9c6abc
// Use of this source code is governed by a BSD-style license
Packit 9c6abc
// that can be found in the COPYING file in the root of the source
Packit 9c6abc
// tree. An additional intellectual property rights grant can be found
Packit 9c6abc
// in the file PATENTS. All contributing project authors may
Packit 9c6abc
// be found in the AUTHORS file in the root of the source tree.
Packit 9c6abc
// -----------------------------------------------------------------------------
Packit 9c6abc
//
Packit 9c6abc
// SSE4 version of some decoding functions.
Packit 9c6abc
//
Packit 9c6abc
// Author: Skal (pascal.massimino@gmail.com)
Packit 9c6abc
Packit 9c6abc
#include "src/dsp/dsp.h"
Packit 9c6abc
Packit 9c6abc
#if defined(WEBP_USE_SSE41)
Packit 9c6abc
Packit 9c6abc
#include <smmintrin.h>
Packit 9c6abc
#include "src/dec/vp8i_dec.h"
Packit 9c6abc
#include "src/utils/utils.h"
Packit 9c6abc
Packit 9c6abc
static void HE16_SSE41(uint8_t* dst) {     // horizontal
Packit 9c6abc
  int j;
Packit 9c6abc
  const __m128i kShuffle3 = _mm_set1_epi8(3);
Packit 9c6abc
  for (j = 16; j > 0; --j) {
Packit 9c6abc
    const __m128i in = _mm_cvtsi32_si128(WebPMemToUint32(dst - 4));
Packit 9c6abc
    const __m128i values = _mm_shuffle_epi8(in, kShuffle3);
Packit 9c6abc
    _mm_storeu_si128((__m128i*)dst, values);
Packit 9c6abc
    dst += BPS;
Packit 9c6abc
  }
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
//------------------------------------------------------------------------------
Packit 9c6abc
// Entry point
Packit 9c6abc
Packit 9c6abc
extern void VP8DspInitSSE41(void);
Packit 9c6abc
Packit 9c6abc
WEBP_TSAN_IGNORE_FUNCTION void VP8DspInitSSE41(void) {
Packit 9c6abc
  VP8PredLuma16[3] = HE16_SSE41;
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
#else  // !WEBP_USE_SSE41
Packit 9c6abc
Packit 9c6abc
// Build without SSE4.1 support: no optimized routines are compiled in.
// NOTE(review): WEBP_DSP_INIT_STUB is defined outside this file; presumably it
// emits an empty VP8DspInitSSE41 so callers still link -- confirm.
WEBP_DSP_INIT_STUB(VP8DspInitSSE41)
Packit 9c6abc
Packit 9c6abc
#endif  // WEBP_USE_SSE41