Blame src/dsp/lossless_enc_mips_dsp_r2.c

Packit 9c6abc
// Copyright 2015 Google Inc. All Rights Reserved.
Packit 9c6abc
//
Packit 9c6abc
// Use of this source code is governed by a BSD-style license
Packit 9c6abc
// that can be found in the COPYING file in the root of the source
Packit 9c6abc
// tree. An additional intellectual property rights grant can be found
Packit 9c6abc
// in the file PATENTS. All contributing project authors may
Packit 9c6abc
// be found in the AUTHORS file in the root of the source tree.
Packit 9c6abc
// -----------------------------------------------------------------------------
Packit 9c6abc
//
Packit 9c6abc
// Image transform methods for lossless encoder.
Packit 9c6abc
//
Packit 9c6abc
// Author(s):  Djordje Pesut    (djordje.pesut@imgtec.com)
Packit 9c6abc
//             Jovan Zelincevic (jovan.zelincevic@imgtec.com)
Packit 9c6abc
Packit 9c6abc
#include "src/dsp/dsp.h"
Packit 9c6abc
Packit 9c6abc
#if defined(WEBP_USE_MIPS_DSP_R2)
Packit 9c6abc
Packit 9c6abc
#include "src/dsp/lossless.h"
Packit 9c6abc
Packit 9c6abc
static void SubtractGreenFromBlueAndRed_MIPSdspR2(uint32_t* argb_data,
Packit 9c6abc
                                                  int num_pixels) {
Packit 9c6abc
  uint32_t temp0, temp1, temp2, temp3, temp4, temp5, temp6, temp7;
Packit 9c6abc
  uint32_t* const p_loop1_end = argb_data + (num_pixels & ~3);
Packit 9c6abc
  uint32_t* const p_loop2_end = p_loop1_end + (num_pixels & 3);
Packit 9c6abc
  __asm__ volatile (
Packit 9c6abc
    ".set       push                                          \n\t"
Packit 9c6abc
    ".set       noreorder                                     \n\t"
Packit 9c6abc
    "beq        %[argb_data],    %[p_loop1_end],     3f       \n\t"
Packit 9c6abc
    " nop                                                     \n\t"
Packit 9c6abc
  "0:                                                         \n\t"
Packit 9c6abc
    "lw         %[temp0],        0(%[argb_data])              \n\t"
Packit 9c6abc
    "lw         %[temp1],        4(%[argb_data])              \n\t"
Packit 9c6abc
    "lw         %[temp2],        8(%[argb_data])              \n\t"
Packit 9c6abc
    "lw         %[temp3],        12(%[argb_data])             \n\t"
Packit 9c6abc
    "ext        %[temp4],        %[temp0],           8,    8  \n\t"
Packit 9c6abc
    "ext        %[temp5],        %[temp1],           8,    8  \n\t"
Packit 9c6abc
    "ext        %[temp6],        %[temp2],           8,    8  \n\t"
Packit 9c6abc
    "ext        %[temp7],        %[temp3],           8,    8  \n\t"
Packit 9c6abc
    "addiu      %[argb_data],    %[argb_data],       16       \n\t"
Packit 9c6abc
    "replv.ph   %[temp4],        %[temp4]                     \n\t"
Packit 9c6abc
    "replv.ph   %[temp5],        %[temp5]                     \n\t"
Packit 9c6abc
    "replv.ph   %[temp6],        %[temp6]                     \n\t"
Packit 9c6abc
    "replv.ph   %[temp7],        %[temp7]                     \n\t"
Packit 9c6abc
    "subu.qb    %[temp0],        %[temp0],           %[temp4] \n\t"
Packit 9c6abc
    "subu.qb    %[temp1],        %[temp1],           %[temp5] \n\t"
Packit 9c6abc
    "subu.qb    %[temp2],        %[temp2],           %[temp6] \n\t"
Packit 9c6abc
    "subu.qb    %[temp3],        %[temp3],           %[temp7] \n\t"
Packit 9c6abc
    "sw         %[temp0],        -16(%[argb_data])            \n\t"
Packit 9c6abc
    "sw         %[temp1],        -12(%[argb_data])            \n\t"
Packit 9c6abc
    "sw         %[temp2],        -8(%[argb_data])             \n\t"
Packit 9c6abc
    "bne        %[argb_data],    %[p_loop1_end],     0b       \n\t"
Packit 9c6abc
    " sw        %[temp3],        -4(%[argb_data])             \n\t"
Packit 9c6abc
  "3:                                                         \n\t"
Packit 9c6abc
    "beq        %[argb_data],    %[p_loop2_end],     2f       \n\t"
Packit 9c6abc
    " nop                                                     \n\t"
Packit 9c6abc
  "1:                                                         \n\t"
Packit 9c6abc
    "lw         %[temp0],        0(%[argb_data])              \n\t"
Packit 9c6abc
    "addiu      %[argb_data],    %[argb_data],       4        \n\t"
Packit 9c6abc
    "ext        %[temp4],        %[temp0],           8,    8  \n\t"
Packit 9c6abc
    "replv.ph   %[temp4],        %[temp4]                     \n\t"
Packit 9c6abc
    "subu.qb    %[temp0],        %[temp0],           %[temp4] \n\t"
Packit 9c6abc
    "bne        %[argb_data],    %[p_loop2_end],     1b       \n\t"
Packit 9c6abc
    " sw        %[temp0],        -4(%[argb_data])             \n\t"
Packit 9c6abc
  "2:                                                         \n\t"
Packit 9c6abc
    ".set       pop                                           \n\t"
Packit 9c6abc
    : [argb_data]"+&r"(argb_data), [temp0]"=&r"(temp0),
Packit 9c6abc
      [temp1]"=&r"(temp1), [temp2]"=&r"(temp2), [temp3]"=&r"(temp3),
Packit 9c6abc
      [temp4]"=&r"(temp4), [temp5]"=&r"(temp5), [temp6]"=&r"(temp6),
Packit 9c6abc
      [temp7]"=&r"(temp7)
Packit 9c6abc
    : [p_loop1_end]"r"(p_loop1_end), [p_loop2_end]"r"(p_loop2_end)
Packit 9c6abc
    : "memory"
Packit 9c6abc
  );
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static WEBP_INLINE uint32_t ColorTransformDelta(int8_t color_pred,
Packit 9c6abc
                                                int8_t color) {
Packit 9c6abc
  return (uint32_t)((int)(color_pred) * color) >> 5;
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static void TransformColor_MIPSdspR2(const VP8LMultipliers* const m,
Packit 9c6abc
                                     uint32_t* data, int num_pixels) {
Packit 9c6abc
  int temp0, temp1, temp2, temp3, temp4, temp5;
Packit 9c6abc
  uint32_t argb, argb1, new_red, new_red1;
Packit 9c6abc
  const uint32_t G_to_R = m->green_to_red_;
Packit 9c6abc
  const uint32_t G_to_B = m->green_to_blue_;
Packit 9c6abc
  const uint32_t R_to_B = m->red_to_blue_;
Packit 9c6abc
  uint32_t* const p_loop_end = data + (num_pixels & ~1);
Packit 9c6abc
  __asm__ volatile (
Packit 9c6abc
    ".set            push                                    \n\t"
Packit 9c6abc
    ".set            noreorder                               \n\t"
Packit 9c6abc
    "beq             %[data],      %[p_loop_end],  1f        \n\t"
Packit 9c6abc
    " nop                                                    \n\t"
Packit 9c6abc
    "replv.ph        %[temp0],     %[G_to_R]                 \n\t"
Packit 9c6abc
    "replv.ph        %[temp1],     %[G_to_B]                 \n\t"
Packit 9c6abc
    "replv.ph        %[temp2],     %[R_to_B]                 \n\t"
Packit 9c6abc
    "shll.ph         %[temp0],     %[temp0],       8         \n\t"
Packit 9c6abc
    "shll.ph         %[temp1],     %[temp1],       8         \n\t"
Packit 9c6abc
    "shll.ph         %[temp2],     %[temp2],       8         \n\t"
Packit 9c6abc
    "shra.ph         %[temp0],     %[temp0],       8         \n\t"
Packit 9c6abc
    "shra.ph         %[temp1],     %[temp1],       8         \n\t"
Packit 9c6abc
    "shra.ph         %[temp2],     %[temp2],       8         \n\t"
Packit 9c6abc
  "0:                                                        \n\t"
Packit 9c6abc
    "lw              %[argb],      0(%[data])                \n\t"
Packit 9c6abc
    "lw              %[argb1],     4(%[data])                \n\t"
Packit 9c6abc
    "lhu             %[new_red],   2(%[data])                \n\t"
Packit 9c6abc
    "lhu             %[new_red1],  6(%[data])                \n\t"
Packit 9c6abc
    "precrq.qb.ph    %[temp3],     %[argb],        %[argb1]  \n\t"
Packit 9c6abc
    "precr.qb.ph     %[temp4],     %[argb],        %[argb1]  \n\t"
Packit 9c6abc
    "preceu.ph.qbra  %[temp3],     %[temp3]                  \n\t"
Packit 9c6abc
    "preceu.ph.qbla  %[temp4],     %[temp4]                  \n\t"
Packit 9c6abc
    "shll.ph         %[temp3],     %[temp3],       8         \n\t"
Packit 9c6abc
    "shll.ph         %[temp4],     %[temp4],       8         \n\t"
Packit 9c6abc
    "shra.ph         %[temp3],     %[temp3],       8         \n\t"
Packit 9c6abc
    "shra.ph         %[temp4],     %[temp4],       8         \n\t"
Packit 9c6abc
    "mul.ph          %[temp5],     %[temp3],       %[temp0]  \n\t"
Packit 9c6abc
    "mul.ph          %[temp3],     %[temp3],       %[temp1]  \n\t"
Packit 9c6abc
    "mul.ph          %[temp4],     %[temp4],       %[temp2]  \n\t"
Packit 9c6abc
    "addiu           %[data],      %[data],        8         \n\t"
Packit 9c6abc
    "ins             %[new_red1],  %[new_red],     16,   16  \n\t"
Packit 9c6abc
    "ins             %[argb1],     %[argb],        16,   16  \n\t"
Packit 9c6abc
    "shra.ph         %[temp5],     %[temp5],       5         \n\t"
Packit 9c6abc
    "shra.ph         %[temp3],     %[temp3],       5         \n\t"
Packit 9c6abc
    "shra.ph         %[temp4],     %[temp4],       5         \n\t"
Packit 9c6abc
    "subu.ph         %[new_red1],  %[new_red1],    %[temp5]  \n\t"
Packit 9c6abc
    "subu.ph         %[argb1],     %[argb1],       %[temp3]  \n\t"
Packit 9c6abc
    "preceu.ph.qbra  %[temp5],     %[new_red1]               \n\t"
Packit 9c6abc
    "subu.ph         %[argb1],     %[argb1],       %[temp4]  \n\t"
Packit 9c6abc
    "preceu.ph.qbra  %[temp3],     %[argb1]                  \n\t"
Packit 9c6abc
    "sb              %[temp5],     -2(%[data])               \n\t"
Packit 9c6abc
    "sb              %[temp3],     -4(%[data])               \n\t"
Packit 9c6abc
    "sra             %[temp5],     %[temp5],       16        \n\t"
Packit 9c6abc
    "sra             %[temp3],     %[temp3],       16        \n\t"
Packit 9c6abc
    "sb              %[temp5],     -6(%[data])               \n\t"
Packit 9c6abc
    "bne             %[data],      %[p_loop_end],  0b        \n\t"
Packit 9c6abc
    " sb             %[temp3],     -8(%[data])               \n\t"
Packit 9c6abc
  "1:                                                        \n\t"
Packit 9c6abc
    ".set            pop                                     \n\t"
Packit 9c6abc
    : [temp0]"=&r"(temp0), [temp1]"=&r"(temp1), [temp2]"=&r"(temp2),
Packit 9c6abc
      [temp3]"=&r"(temp3), [temp4]"=&r"(temp4), [temp5]"=&r"(temp5),
Packit 9c6abc
      [new_red1]"=&r"(new_red1), [new_red]"=&r"(new_red),
Packit 9c6abc
      [argb]"=&r"(argb), [argb1]"=&r"(argb1), [data]"+&r"(data)
Packit 9c6abc
    : [G_to_R]"r"(G_to_R), [R_to_B]"r"(R_to_B),
Packit 9c6abc
      [G_to_B]"r"(G_to_B), [p_loop_end]"r"(p_loop_end)
Packit 9c6abc
    : "memory", "hi", "lo"
Packit 9c6abc
  );
Packit 9c6abc
Packit 9c6abc
  if (num_pixels & 1) {
Packit 9c6abc
    const uint32_t argb_ = data[0];
Packit 9c6abc
    const uint32_t green = argb_ >> 8;
Packit 9c6abc
    const uint32_t red = argb_ >> 16;
Packit 9c6abc
    uint32_t new_blue = argb_;
Packit 9c6abc
    new_red = red;
Packit 9c6abc
    new_red -= ColorTransformDelta(m->green_to_red_, green);
Packit 9c6abc
    new_red &= 0xff;
Packit 9c6abc
    new_blue -= ColorTransformDelta(m->green_to_blue_, green);
Packit 9c6abc
    new_blue -= ColorTransformDelta(m->red_to_blue_, red);
Packit 9c6abc
    new_blue &= 0xff;
Packit 9c6abc
    data[0] = (argb_ & 0xff00ff00u) | (new_red << 16) | (new_blue);
Packit 9c6abc
  }
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static WEBP_INLINE uint8_t TransformColorBlue(uint8_t green_to_blue,
Packit 9c6abc
                                              uint8_t red_to_blue,
Packit 9c6abc
                                              uint32_t argb) {
Packit 9c6abc
  const uint32_t green = argb >> 8;
Packit 9c6abc
  const uint32_t red = argb >> 16;
Packit 9c6abc
  uint8_t new_blue = argb;
Packit 9c6abc
  new_blue -= ColorTransformDelta(green_to_blue, green);
Packit 9c6abc
  new_blue -= ColorTransformDelta(red_to_blue, red);
Packit 9c6abc
  return (new_blue & 0xff);
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static void CollectColorBlueTransforms_MIPSdspR2(const uint32_t* argb,
Packit 9c6abc
                                                 int stride,
Packit 9c6abc
                                                 int tile_width,
Packit 9c6abc
                                                 int tile_height,
Packit 9c6abc
                                                 int green_to_blue,
Packit 9c6abc
                                                 int red_to_blue,
Packit 9c6abc
                                                 int histo[]) {
Packit 9c6abc
  const int rtb = (red_to_blue << 16) | (red_to_blue & 0xffff);
Packit 9c6abc
  const int gtb = (green_to_blue << 16) | (green_to_blue & 0xffff);
Packit 9c6abc
  const uint32_t mask = 0xff00ffu;
Packit 9c6abc
  while (tile_height-- > 0) {
Packit 9c6abc
    int x;
Packit 9c6abc
    const uint32_t* p_argb = argb;
Packit 9c6abc
    argb += stride;
Packit 9c6abc
    for (x = 0; x < (tile_width >> 1); ++x) {
Packit 9c6abc
      int temp0, temp1, temp2, temp3, temp4, temp5, temp6;
Packit 9c6abc
      __asm__ volatile (
Packit 9c6abc
        "lw           %[temp0],  0(%[p_argb])             \n\t"
Packit 9c6abc
        "lw           %[temp1],  4(%[p_argb])             \n\t"
Packit 9c6abc
        "precr.qb.ph  %[temp2],  %[temp0],  %[temp1]      \n\t"
Packit 9c6abc
        "ins          %[temp1],  %[temp0],  16,    16     \n\t"
Packit 9c6abc
        "shra.ph      %[temp2],  %[temp2],  8             \n\t"
Packit 9c6abc
        "shra.ph      %[temp3],  %[temp1],  8             \n\t"
Packit 9c6abc
        "mul.ph       %[temp5],  %[temp2],  %[rtb]        \n\t"
Packit 9c6abc
        "mul.ph       %[temp6],  %[temp3],  %[gtb]        \n\t"
Packit 9c6abc
        "and          %[temp4],  %[temp1],  %[mask]       \n\t"
Packit 9c6abc
        "addiu        %[p_argb], %[p_argb], 8             \n\t"
Packit 9c6abc
        "shra.ph      %[temp5],  %[temp5],  5             \n\t"
Packit 9c6abc
        "shra.ph      %[temp6],  %[temp6],  5             \n\t"
Packit 9c6abc
        "subu.qb      %[temp2],  %[temp4],  %[temp5]      \n\t"
Packit 9c6abc
        "subu.qb      %[temp2],  %[temp2],  %[temp6]      \n\t"
Packit 9c6abc
        : [p_argb]"+&r"(p_argb), [temp0]"=&r"(temp0), [temp1]"=&r"(temp1),
Packit 9c6abc
          [temp2]"=&r"(temp2), [temp3]"=&r"(temp3), [temp4]"=&r"(temp4),
Packit 9c6abc
          [temp5]"=&r"(temp5), [temp6]"=&r"(temp6)
Packit 9c6abc
        : [rtb]"r"(rtb), [gtb]"r"(gtb), [mask]"r"(mask)
Packit 9c6abc
        : "memory", "hi", "lo"
Packit 9c6abc
      );
Packit 9c6abc
      ++histo[(uint8_t)(temp2 >> 16)];
Packit 9c6abc
      ++histo[(uint8_t)temp2];
Packit 9c6abc
    }
Packit 9c6abc
    if (tile_width & 1) {
Packit 9c6abc
      ++histo[TransformColorBlue(green_to_blue, red_to_blue, *p_argb)];
Packit 9c6abc
    }
Packit 9c6abc
  }
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static WEBP_INLINE uint8_t TransformColorRed(uint8_t green_to_red,
Packit 9c6abc
                                             uint32_t argb) {
Packit 9c6abc
  const uint32_t green = argb >> 8;
Packit 9c6abc
  uint32_t new_red = argb >> 16;
Packit 9c6abc
  new_red -= ColorTransformDelta(green_to_red, green);
Packit 9c6abc
  return (new_red & 0xff);
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
static void CollectColorRedTransforms_MIPSdspR2(const uint32_t* argb,
Packit 9c6abc
                                                int stride,
Packit 9c6abc
                                                int tile_width,
Packit 9c6abc
                                                int tile_height,
Packit 9c6abc
                                                int green_to_red,
Packit 9c6abc
                                                int histo[]) {
Packit 9c6abc
  const int gtr = (green_to_red << 16) | (green_to_red & 0xffff);
Packit 9c6abc
  while (tile_height-- > 0) {
Packit 9c6abc
    int x;
Packit 9c6abc
    const uint32_t* p_argb = argb;
Packit 9c6abc
    argb += stride;
Packit 9c6abc
    for (x = 0; x < (tile_width >> 1); ++x) {
Packit 9c6abc
      int temp0, temp1, temp2, temp3, temp4;
Packit 9c6abc
      __asm__ volatile (
Packit 9c6abc
        "lw           %[temp0],  0(%[p_argb])             \n\t"
Packit 9c6abc
        "lw           %[temp1],  4(%[p_argb])             \n\t"
Packit 9c6abc
        "precrq.ph.w  %[temp4],  %[temp0],  %[temp1]      \n\t"
Packit 9c6abc
        "ins          %[temp1],  %[temp0],  16,    16     \n\t"
Packit 9c6abc
        "shra.ph      %[temp3],  %[temp1],  8             \n\t"
Packit 9c6abc
        "mul.ph       %[temp2],  %[temp3],  %[gtr]        \n\t"
Packit 9c6abc
        "addiu        %[p_argb], %[p_argb], 8             \n\t"
Packit 9c6abc
        "shra.ph      %[temp2],  %[temp2],  5             \n\t"
Packit 9c6abc
        "subu.qb      %[temp2],  %[temp4],  %[temp2]      \n\t"
Packit 9c6abc
        : [p_argb]"+&r"(p_argb), [temp0]"=&r"(temp0), [temp1]"=&r"(temp1),
Packit 9c6abc
          [temp2]"=&r"(temp2), [temp3]"=&r"(temp3), [temp4]"=&r"(temp4)
Packit 9c6abc
        : [gtr]"r"(gtr)
Packit 9c6abc
        : "memory", "hi", "lo"
Packit 9c6abc
      );
Packit 9c6abc
      ++histo[(uint8_t)(temp2 >> 16)];
Packit 9c6abc
      ++histo[(uint8_t)temp2];
Packit 9c6abc
    }
Packit 9c6abc
    if (tile_width & 1) {
Packit 9c6abc
      ++histo[TransformColorRed(green_to_red, *p_argb)];
Packit 9c6abc
    }
Packit 9c6abc
  }
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
//------------------------------------------------------------------------------
Packit 9c6abc
// Entry point
Packit 9c6abc
Packit 9c6abc
extern void VP8LEncDspInitMIPSdspR2(void);
Packit 9c6abc
Packit 9c6abc
WEBP_TSAN_IGNORE_FUNCTION void VP8LEncDspInitMIPSdspR2(void) {
Packit 9c6abc
  VP8LSubtractGreenFromBlueAndRed = SubtractGreenFromBlueAndRed_MIPSdspR2;
Packit 9c6abc
  VP8LTransformColor = TransformColor_MIPSdspR2;
Packit 9c6abc
  VP8LCollectColorBlueTransforms = CollectColorBlueTransforms_MIPSdspR2;
Packit 9c6abc
  VP8LCollectColorRedTransforms = CollectColorRedTransforms_MIPSdspR2;
Packit 9c6abc
}
Packit 9c6abc
Packit 9c6abc
#else  // !WEBP_USE_MIPS_DSP_R2
Packit 9c6abc
Packit 9c6abc
WEBP_DSP_INIT_STUB(VP8LEncDspInitMIPSdspR2)
Packit 9c6abc
Packit 9c6abc
#endif  // WEBP_USE_MIPS_DSP_R2