x86: mmx2 ---> mmxext in variable names

[ffmpeg] / libswscale / x86 / swscale_template.c
diff --git a/libswscale/x86/swscale_template.c b/libswscale/x86/swscale_template.c

index ae05c0b50656c7024853b9e1ec0af1b23e4b35c5..d7a2fdbe18297c17a10ed154e41e0a0d6a74e95a 100644 (file)
--- a/libswscale/x86/swscale_template.c
+++ b/libswscale/x86/swscale_template.c
@@ -22,13 +22,13 @@
  #undef MOVNTQ
  #undef PREFETCH
  
-#if COMPILE_TEMPLATE_MMX2
+#if COMPILE_TEMPLATE_MMXEXT
  #define PREFETCH "prefetchnta"
  #else
  #define PREFETCH  " # nop"
  #endif
  
-#if COMPILE_TEMPLATE_MMX2
+#if COMPILE_TEMPLATE_MMXEXT
  #define REAL_MOVNTQ(a,b) "movntq " #a ", " #b " \n\t"
  #else
  #define REAL_MOVNTQ(a,b) "movq " #a ", " #b " \n\t"
@@ -268,7 +268,7 @@ static void RENAME(yuv2rgb32_X_ar)(SwsContext *c, const int16_t *lumFilter,
          "movq                      %%mm2, "U_TEMP"(%0)  \n\t"
          "movq                      %%mm4, "V_TEMP"(%0)  \n\t"
          "movq                      %%mm5, "Y_TEMP"(%0)  \n\t"
-        YSCALEYUV2PACKEDX_ACCURATE_YA(LUM_MMX_FILTER_OFFSET)
+        YSCALEYUV2PACKEDX_ACCURATE_YA(ALP_MMX_FILTER_OFFSET)
          "movq               "Y_TEMP"(%0), %%mm5         \n\t"
          "psraw                        $3, %%mm1         \n\t"
          "psraw                        $3, %%mm7         \n\t"
@@ -298,7 +298,7 @@ static void RENAME(yuv2rgb32_X)(SwsContext *c, const int16_t *lumFilter,
      if (CONFIG_SWSCALE_ALPHA && c->alpPixBuf) {
          YSCALEYUV2PACKEDX
          YSCALEYUV2RGBX
-        YSCALEYUV2PACKEDX_YA(LUM_MMX_FILTER_OFFSET, %%mm0, %%mm3, %%mm6, %%mm1, %%mm7)
+        YSCALEYUV2PACKEDX_YA(ALP_MMX_FILTER_OFFSET, %%mm0, %%mm3, %%mm6, %%mm1, %%mm7)
          "psraw                        $3, %%mm1         \n\t"
          "psraw                        $3, %%mm7         \n\t"
          "packuswb                  %%mm7, %%mm1         \n\t"
@@ -567,7 +567,7 @@ static void RENAME(yuv2rgb555_X)(SwsContext *c, const int16_t *lumFilter,
      "cmp  "#dstw", "#index"     \n\t"\
      " jb       1b               \n\t"
  
-#if COMPILE_TEMPLATE_MMX2
+#if COMPILE_TEMPLATE_MMXEXT
  #undef WRITEBGR24
  #define WRITEBGR24(dst, dstw, index)  WRITEBGR24MMX2(dst, dstw, index)
  #else
@@ -1088,14 +1088,15 @@ static void RENAME(yuv2yuyv422_2)(SwsContext *c, const int16_t *buf[2],
   * YV12 to RGB without scaling or interpolating
   */
  static void RENAME(yuv2rgb32_1)(SwsContext *c, const int16_t *buf0,
-                                const int16_t *ubuf[2], const int16_t *bguf[2],
+                                const int16_t *ubuf[2], const int16_t *vbuf[2],
                                  const int16_t *abuf0, uint8_t *dest,
                                  int dstW, int uvalpha, int y)
  {
-    const int16_t *ubuf0 = ubuf[0], *ubuf1 = ubuf[1];
+    const int16_t *ubuf0 = ubuf[0];
      const int16_t *buf1= buf0; //FIXME needed for RGB1/BGR1
  
      if (uvalpha < 2048) { // note this is not correct (shifts chrominance by 0.5 pixels) but it is a bit faster
+        const int16_t *ubuf1 = ubuf[0];
          if (CONFIG_SWSCALE_ALPHA && c->alpPixBuf) {
              __asm__ volatile(
                  "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
@@ -1124,6 +1125,7 @@ static void RENAME(yuv2rgb32_1)(SwsContext *c, const int16_t *buf0,
              );
          }
      } else {
+        const int16_t *ubuf1 = ubuf[1];
          if (CONFIG_SWSCALE_ALPHA && c->alpPixBuf) {
              __asm__ volatile(
                  "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
@@ -1155,14 +1157,15 @@ static void RENAME(yuv2rgb32_1)(SwsContext *c, const int16_t *buf0,
  }
  
  static void RENAME(yuv2bgr24_1)(SwsContext *c, const int16_t *buf0,
-                                const int16_t *ubuf[2], const int16_t *bguf[2],
+                                const int16_t *ubuf[2], const int16_t *vbuf[2],
                                  const int16_t *abuf0, uint8_t *dest,
                                  int dstW, int uvalpha, int y)
  {
-    const int16_t *ubuf0 = ubuf[0], *ubuf1 = ubuf[1];
+    const int16_t *ubuf0 = ubuf[0];
      const int16_t *buf1= buf0; //FIXME needed for RGB1/BGR1
  
      if (uvalpha < 2048) { // note this is not correct (shifts chrominance by 0.5 pixels) but it is a bit faster
+        const int16_t *ubuf1 = ubuf[0];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1176,6 +1179,7 @@ static void RENAME(yuv2bgr24_1)(SwsContext *c, const int16_t *buf0,
                 "a" (&c->redDither)
          );
      } else {
+        const int16_t *ubuf1 = ubuf[1];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1192,14 +1196,15 @@ static void RENAME(yuv2bgr24_1)(SwsContext *c, const int16_t *buf0,
  }
  
  static void RENAME(yuv2rgb555_1)(SwsContext *c, const int16_t *buf0,
-                                 const int16_t *ubuf[2], const int16_t *bguf[2],
+                                 const int16_t *ubuf[2], const int16_t *vbuf[2],
                                   const int16_t *abuf0, uint8_t *dest,
                                   int dstW, int uvalpha, int y)
  {
-    const int16_t *ubuf0 = ubuf[0], *ubuf1 = ubuf[1];
+    const int16_t *ubuf0 = ubuf[0];
      const int16_t *buf1= buf0; //FIXME needed for RGB1/BGR1
  
      if (uvalpha < 2048) { // note this is not correct (shifts chrominance by 0.5 pixels) but it is a bit faster
+        const int16_t *ubuf1 = ubuf[0];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1219,6 +1224,7 @@ static void RENAME(yuv2rgb555_1)(SwsContext *c, const int16_t *buf0,
                 "a" (&c->redDither)
          );
      } else {
+        const int16_t *ubuf1 = ubuf[1];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1241,14 +1247,15 @@ static void RENAME(yuv2rgb555_1)(SwsContext *c, const int16_t *buf0,
  }
  
  static void RENAME(yuv2rgb565_1)(SwsContext *c, const int16_t *buf0,
-                                 const int16_t *ubuf[2], const int16_t *bguf[2],
+                                 const int16_t *ubuf[2], const int16_t *vbuf[2],
                                   const int16_t *abuf0, uint8_t *dest,
                                   int dstW, int uvalpha, int y)
  {
-    const int16_t *ubuf0 = ubuf[0], *ubuf1 = ubuf[1];
+    const int16_t *ubuf0 = ubuf[0];
      const int16_t *buf1= buf0; //FIXME needed for RGB1/BGR1
  
      if (uvalpha < 2048) { // note this is not correct (shifts chrominance by 0.5 pixels) but it is a bit faster
+        const int16_t *ubuf1 = ubuf[0];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1268,6 +1275,7 @@ static void RENAME(yuv2rgb565_1)(SwsContext *c, const int16_t *buf0,
                 "a" (&c->redDither)
          );
      } else {
+        const int16_t *ubuf1 = ubuf[1];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1327,14 +1335,15 @@ static void RENAME(yuv2rgb565_1)(SwsContext *c, const int16_t *buf0,
  #define YSCALEYUV2PACKED1b(index, c)  REAL_YSCALEYUV2PACKED1b(index, c)
  
  static void RENAME(yuv2yuyv422_1)(SwsContext *c, const int16_t *buf0,
-                                  const int16_t *ubuf[2], const int16_t *bguf[2],
+                                  const int16_t *ubuf[2], const int16_t *vbuf[2],
                                    const int16_t *abuf0, uint8_t *dest,
                                    int dstW, int uvalpha, int y)
  {
-    const int16_t *ubuf0 = ubuf[0], *ubuf1 = ubuf[1];
+    const int16_t *ubuf0 = ubuf[0];
      const int16_t *buf1= buf0; //FIXME needed for RGB1/BGR1
  
      if (uvalpha < 2048) { // note this is not correct (shifts chrominance by 0.5 pixels) but it is a bit faster
+        const int16_t *ubuf1 = ubuf[0];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1347,6 +1356,7 @@ static void RENAME(yuv2yuyv422_1)(SwsContext *c, const int16_t *buf0,
                 "a" (&c->redDither)
          );
      } else {
+        const int16_t *ubuf1 = ubuf[1];
          __asm__ volatile(
              "mov %%"REG_b", "ESP_OFFSET"(%5)        \n\t"
              "mov        %4, %%"REG_b"               \n\t"
@@ -1361,14 +1371,14 @@ static void RENAME(yuv2yuyv422_1)(SwsContext *c, const int16_t *buf0,
      }
  }
  
-#if COMPILE_TEMPLATE_MMX2
+#if COMPILE_TEMPLATE_MMXEXT
  static void RENAME(hyscale_fast)(SwsContext *c, int16_t *dst,
                                   int dstWidth, const uint8_t *src,
                                   int srcW, int xInc)
  {
-    int16_t *filterPos = c->hLumFilterPos;
+    int32_t *filterPos = c->hLumFilterPos;
      int16_t *filter    = c->hLumFilter;
-    void    *mmx2FilterCode= c->lumMmx2FilterCode;
+    void    *mmxextFilterCode = c->lumMmxextFilterCode;
      int i;
  #if defined(PIC)
      uint64_t ebxsave;
@@ -1441,7 +1451,7 @@ static void RENAME(hyscale_fast)(SwsContext *c, int16_t *dst,
  #endif
  #endif
          :: "m" (src), "m" (dst), "m" (filter), "m" (filterPos),
-           "m" (mmx2FilterCode)
+           "m" (mmxextFilterCode)
  #if defined(PIC)
            ,"m" (ebxsave)
  #endif
@@ -1462,9 +1472,9 @@ static void RENAME(hcscale_fast)(SwsContext *c, int16_t *dst1, int16_t *dst2,
                                   int dstWidth, const uint8_t *src1,
                                   const uint8_t *src2, int srcW, int xInc)
  {
-    int16_t *filterPos = c->hChrFilterPos;
+    int32_t *filterPos = c->hChrFilterPos;
      int16_t *filter    = c->hChrFilter;
-    void    *mmx2FilterCode= c->chrMmx2FilterCode;
+    void    *mmxextFilterCode = c->chrMmxextFilterCode;
      int i;
  #if defined(PIC)
      DECLARE_ALIGNED(8, uint64_t, ebxsave);
@@ -1525,7 +1535,7 @@ static void RENAME(hcscale_fast)(SwsContext *c, int16_t *dst1, int16_t *dst2,
  #endif
  #endif
          :: "m" (src1), "m" (dst1), "m" (filter), "m" (filterPos),
-           "m" (mmx2FilterCode), "m" (src2), "m"(dst2)
+           "m" (mmxextFilterCode), "m" (src2), "m"(dst2)
  #if defined(PIC)
            ,"m" (ebxsave)
  #endif
@@ -1543,34 +1553,34 @@ static void RENAME(hcscale_fast)(SwsContext *c, int16_t *dst1, int16_t *dst2,
          dst2[i] = src2[srcW-1]*128;
      }
  }
-#endif /* COMPILE_TEMPLATE_MMX2 */
+#endif /* COMPILE_TEMPLATE_MMXEXT */
  
  static av_cold void RENAME(sws_init_swScale)(SwsContext *c)
  {
-    enum PixelFormat dstFormat = c->dstFormat;
+    enum AVPixelFormat dstFormat = c->dstFormat;
  
      if (!is16BPS(dstFormat) && !is9_OR_10BPS(dstFormat) &&
-        dstFormat != PIX_FMT_NV12 && dstFormat != PIX_FMT_NV21) {
+        dstFormat != AV_PIX_FMT_NV12 && dstFormat != AV_PIX_FMT_NV21) {
          if (!(c->flags & SWS_BITEXACT)) {
              if (c->flags & SWS_ACCURATE_RND) {
                  if (!(c->flags & SWS_FULL_CHR_H_INT)) {
                      switch (c->dstFormat) {
-                    case PIX_FMT_RGB32:   c->yuv2packedX = RENAME(yuv2rgb32_X_ar);   break;
-                    case PIX_FMT_BGR24:   c->yuv2packedX = RENAME(yuv2bgr24_X_ar);   break;
-                    case PIX_FMT_RGB555:  c->yuv2packedX = RENAME(yuv2rgb555_X_ar);  break;
-                    case PIX_FMT_RGB565:  c->yuv2packedX = RENAME(yuv2rgb565_X_ar);  break;
-                    case PIX_FMT_YUYV422: c->yuv2packedX = RENAME(yuv2yuyv422_X_ar); break;
+                    case AV_PIX_FMT_RGB32:   c->yuv2packedX = RENAME(yuv2rgb32_X_ar);   break;
+                    case AV_PIX_FMT_BGR24:   c->yuv2packedX = RENAME(yuv2bgr24_X_ar);   break;
+                    case AV_PIX_FMT_RGB555:  c->yuv2packedX = RENAME(yuv2rgb555_X_ar);  break;
+                    case AV_PIX_FMT_RGB565:  c->yuv2packedX = RENAME(yuv2rgb565_X_ar);  break;
+                    case AV_PIX_FMT_YUYV422: c->yuv2packedX = RENAME(yuv2yuyv422_X_ar); break;
                      default: break;
                      }
                  }
              } else {
                  if (!(c->flags & SWS_FULL_CHR_H_INT)) {
                      switch (c->dstFormat) {
-                    case PIX_FMT_RGB32:   c->yuv2packedX = RENAME(yuv2rgb32_X);   break;
-                    case PIX_FMT_BGR24:   c->yuv2packedX = RENAME(yuv2bgr24_X);   break;
-                    case PIX_FMT_RGB555:  c->yuv2packedX = RENAME(yuv2rgb555_X);  break;
-                    case PIX_FMT_RGB565:  c->yuv2packedX = RENAME(yuv2rgb565_X);  break;
-                    case PIX_FMT_YUYV422: c->yuv2packedX = RENAME(yuv2yuyv422_X); break;
+                    case AV_PIX_FMT_RGB32:   c->yuv2packedX = RENAME(yuv2rgb32_X);   break;
+                    case AV_PIX_FMT_BGR24:   c->yuv2packedX = RENAME(yuv2bgr24_X);   break;
+                    case AV_PIX_FMT_RGB555:  c->yuv2packedX = RENAME(yuv2rgb555_X);  break;
+                    case AV_PIX_FMT_RGB565:  c->yuv2packedX = RENAME(yuv2rgb565_X);  break;
+                    case AV_PIX_FMT_YUYV422: c->yuv2packedX = RENAME(yuv2yuyv422_X); break;
                      default: break;
                      }
                  }
@@ -1578,23 +1588,23 @@ static av_cold void RENAME(sws_init_swScale)(SwsContext *c)
          }
          if (!(c->flags & SWS_FULL_CHR_H_INT)) {
              switch (c->dstFormat) {
-            case PIX_FMT_RGB32:
+            case AV_PIX_FMT_RGB32:
                  c->yuv2packed1 = RENAME(yuv2rgb32_1);
                  c->yuv2packed2 = RENAME(yuv2rgb32_2);
                  break;
-            case PIX_FMT_BGR24:
+            case AV_PIX_FMT_BGR24:
                  c->yuv2packed1 = RENAME(yuv2bgr24_1);
                  c->yuv2packed2 = RENAME(yuv2bgr24_2);
                  break;
-            case PIX_FMT_RGB555:
+            case AV_PIX_FMT_RGB555:
                  c->yuv2packed1 = RENAME(yuv2rgb555_1);
                  c->yuv2packed2 = RENAME(yuv2rgb555_2);
                  break;
-            case PIX_FMT_RGB565:
+            case AV_PIX_FMT_RGB565:
                  c->yuv2packed1 = RENAME(yuv2rgb565_1);
                  c->yuv2packed2 = RENAME(yuv2rgb565_2);
                  break;
-            case PIX_FMT_YUYV422:
+            case AV_PIX_FMT_YUYV422:
                  c->yuv2packed1 = RENAME(yuv2yuyv422_1);
                  c->yuv2packed2 = RENAME(yuv2yuyv422_2);
                  break;
@@ -1605,18 +1615,17 @@ static av_cold void RENAME(sws_init_swScale)(SwsContext *c)
      }
  
      if (c->srcBpc == 8 && c->dstBpc <= 10) {
-    // Use the new MMX scaler if the MMX2 one can't be used (it is faster than the x86 ASM one).
-#if COMPILE_TEMPLATE_MMX2
-    if (c->flags & SWS_FAST_BILINEAR && c->canMMX2BeUsed)
-    {
+    // Use the new MMX scaler if the MMXEXT one can't be used (it is faster than the x86 ASM one).
+#if COMPILE_TEMPLATE_MMXEXT
+    if (c->flags & SWS_FAST_BILINEAR && c->canMMXEXTBeUsed) {
          c->hyscale_fast = RENAME(hyscale_fast);
          c->hcscale_fast = RENAME(hcscale_fast);
      } else {
-#endif /* COMPILE_TEMPLATE_MMX2 */
+#endif /* COMPILE_TEMPLATE_MMXEXT */
          c->hyscale_fast = NULL;
          c->hcscale_fast = NULL;
-#if COMPILE_TEMPLATE_MMX2
+#if COMPILE_TEMPLATE_MMXEXT
      }
-#endif /* COMPILE_TEMPLATE_MMX2 */
+#endif /* COMPILE_TEMPLATE_MMXEXT */
      }
  }