Merge commit '0801853e640624537db386727b36fa97aa6258e7'

[ffmpeg] / libavcodec / vp8dsp.c
diff --git a/libavcodec/vp8dsp.c b/libavcodec/vp8dsp.c
index ac9a6affc9b509184d7e1e4e10b34423380bbcf7..4ff63d078425873ba9280efc6e564a935a89de1c 100644
--- a/libavcodec/vp8dsp.c
+++ b/libavcodec/vp8dsp.c
@@ -3,20 +3,20 @@
   * Copyright (C) 2010 Ronald S. Bultje
   * Copyright (C) 2014 Peter Ross
   *
- * This file is part of Libav.
+ * This file is part of FFmpeg.
   *
- * Libav is free software; you can redistribute it and/or
+ * FFmpeg is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
- * Libav is distributed in the hope that it will be useful,
+ * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
- * License along with Libav; if not, write to the Free Software
+ * License along with FFmpeg; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
@@ -26,6 +26,7 @@
   */
  
  #include "libavutil/common.h"
+#include "libavutil/intreadwrite.h"
  
  #include "mathops.h"
  #include "vp8dsp.h"
@@ -52,7 +53,8 @@ static void name ## _idct_dc_add4y_c(uint8_t *dst, int16_t block[4][16],      \
  #if CONFIG_VP7_DECODER
  static void vp7_luma_dc_wht_c(int16_t block[4][4][16], int16_t dc[16])
  {
-    int i, a1, b1, c1, d1;
+    int i;
+    unsigned a1, b1, c1, d1;
      int16_t tmp[16];
  
      for (i = 0; i < 4; i++) {
@@ -60,10 +62,10 @@ static void vp7_luma_dc_wht_c(int16_t block[4][4][16], int16_t dc[16])
          b1 = (dc[i * 4 + 0] - dc[i * 4 + 2]) * 23170;
          c1 = dc[i * 4 + 1] * 12540 - dc[i * 4 + 3] * 30274;
          d1 = dc[i * 4 + 1] * 30274 + dc[i * 4 + 3] * 12540;
-        tmp[i * 4 + 0] = (a1 + d1) >> 14;
-        tmp[i * 4 + 3] = (a1 - d1) >> 14;
-        tmp[i * 4 + 1] = (b1 + c1) >> 14;
-        tmp[i * 4 + 2] = (b1 - c1) >> 14;
+        tmp[i * 4 + 0] = (int)(a1 + d1) >> 14;
+        tmp[i * 4 + 3] = (int)(a1 - d1) >> 14;
+        tmp[i * 4 + 1] = (int)(b1 + c1) >> 14;
+        tmp[i * 4 + 2] = (int)(b1 - c1) >> 14;
      }
  
      for (i = 0; i < 4; i++) {
@@ -71,14 +73,11 @@ static void vp7_luma_dc_wht_c(int16_t block[4][4][16], int16_t dc[16])
          b1 = (tmp[i + 0] - tmp[i + 8]) * 23170;
          c1 = tmp[i + 4] * 12540 - tmp[i + 12] * 30274;
          d1 = tmp[i + 4] * 30274 + tmp[i + 12] * 12540;
-        dc[i * 4 + 0] = 0;
-        dc[i * 4 + 1] = 0;
-        dc[i * 4 + 2] = 0;
-        dc[i * 4 + 3] = 0;
-        block[0][i][0] = (a1 + d1 + 0x20000) >> 18;
-        block[3][i][0] = (a1 - d1 + 0x20000) >> 18;
-        block[1][i][0] = (b1 + c1 + 0x20000) >> 18;
-        block[2][i][0] = (b1 - c1 + 0x20000) >> 18;
+        AV_ZERO64(dc + i * 4);
+        block[0][i][0] = (int)(a1 + d1 + 0x20000) >> 18;
+        block[3][i][0] = (int)(a1 - d1 + 0x20000) >> 18;
+        block[1][i][0] = (int)(b1 + c1 + 0x20000) >> 18;
+        block[2][i][0] = (int)(b1 - c1 + 0x20000) >> 18;
      }
  }
  
@@ -97,7 +96,8 @@ static void vp7_luma_dc_wht_dc_c(int16_t block[4][4][16], int16_t dc[16])
  
  static void vp7_idct_add_c(uint8_t *dst, int16_t block[16], ptrdiff_t stride)
  {
-    int i, a1, b1, c1, d1;
+    int i;
+    unsigned a1, b1, c1, d1;
      int16_t tmp[16];
  
      for (i = 0; i < 4; i++) {
@@ -105,14 +105,11 @@ static void vp7_idct_add_c(uint8_t *dst, int16_t block[16], ptrdiff_t stride)
          b1 = (block[i * 4 + 0] - block[i * 4 + 2]) * 23170;
          c1 = block[i * 4 + 1] * 12540 - block[i * 4 + 3] * 30274;
          d1 = block[i * 4 + 1] * 30274 + block[i * 4 + 3] * 12540;
-        block[i * 4 + 0] = 0;
-        block[i * 4 + 1] = 0;
-        block[i * 4 + 2] = 0;
-        block[i * 4 + 3] = 0;
-        tmp[i * 4 + 0] = (a1 + d1) >> 14;
-        tmp[i * 4 + 3] = (a1 - d1) >> 14;
-        tmp[i * 4 + 1] = (b1 + c1) >> 14;
-        tmp[i * 4 + 2] = (b1 - c1) >> 14;
+        AV_ZERO64(block + i * 4);
+        tmp[i * 4 + 0] = (int)(a1 + d1) >> 14;
+        tmp[i * 4 + 3] = (int)(a1 - d1) >> 14;
+        tmp[i * 4 + 1] = (int)(b1 + c1) >> 14;
+        tmp[i * 4 + 2] = (int)(b1 - c1) >> 14;
      }
  
      for (i = 0; i < 4; i++) {
@@ -121,13 +118,13 @@ static void vp7_idct_add_c(uint8_t *dst, int16_t block[16], ptrdiff_t stride)
          c1 = tmp[i + 4] * 12540 - tmp[i + 12] * 30274;
          d1 = tmp[i + 4] * 30274 + tmp[i + 12] * 12540;
          dst[0 * stride + i] = av_clip_uint8(dst[0 * stride + i] +
-                                            ((a1 + d1 + 0x20000) >> 18));
+                                            ((int)(a1 + d1 + 0x20000) >> 18));
          dst[3 * stride + i] = av_clip_uint8(dst[3 * stride + i] +
-                                            ((a1 - d1 + 0x20000) >> 18));
+                                            ((int)(a1 - d1 + 0x20000) >> 18));
          dst[1 * stride + i] = av_clip_uint8(dst[1 * stride + i] +
-                                            ((b1 + c1 + 0x20000) >> 18));
+                                            ((int)(b1 + c1 + 0x20000) >> 18));
          dst[2 * stride + i] = av_clip_uint8(dst[2 * stride + i] +
-                                            ((b1 - c1 + 0x20000) >> 18));
+                                            ((int)(b1 - c1 + 0x20000) >> 18));
      }
  }
  
@@ -171,10 +168,7 @@ static void vp8_luma_dc_wht_c(int16_t block[4][4][16], int16_t dc[16])
          t1 = dc[i * 4 + 1] + dc[i * 4 + 2];
          t2 = dc[i * 4 + 1] - dc[i * 4 + 2];
          t3 = dc[i * 4 + 0] - dc[i * 4 + 3] + 3; // rounding
-        dc[i * 4 + 0] = 0;
-        dc[i * 4 + 1] = 0;
-        dc[i * 4 + 2] = 0;
-        dc[i * 4 + 3] = 0;
+        AV_ZERO64(dc + i * 4);
  
          block[i][0][0] = (t0 + t1) >> 3;
          block[i][1][0] = (t3 + t2) >> 3;
@@ -262,7 +256,7 @@ MK_IDCT_DC_ADD4_C(vp8)
      int av_unused q2 = p[ 2 * stride];                                        \
      int av_unused q3 = p[ 3 * stride];
  
-#define clip_int8(n) (cm[n + 0x80] - 0x80)
+#define clip_int8(n) (cm[(n) + 0x80] - 0x80)
  
  static av_always_inline void filter_common(uint8_t *p, ptrdiff_t stride,
                                             int is4tap, int is_vp7)
@@ -747,5 +741,7 @@ av_cold void ff_vp8dsp_init(VP8DSPContext *dsp)
          ff_vp8dsp_init_arm(dsp);
      if (ARCH_X86)
          ff_vp8dsp_init_x86(dsp);
+    if (ARCH_MIPS)
+        ff_vp8dsp_init_mips(dsp);
  }
  #endif /* CONFIG_VP8_DECODER */