]> git.sesse.net Git - ffmpeg/commitdiff
avcodec/qtrle : 32bpp dec copy two raw argb value at the same time
authorMartin Vignali <martin.vignali@gmail.com>
Tue, 26 Feb 2019 09:38:10 +0000 (10:38 +0100)
committerMartin Vignali <martin.vignali@gmail.com>
Mon, 4 Mar 2019 12:03:42 +0000 (13:03 +0100)
benchmark on x86_64 :
38 fps -> 40 fps

libavcodec/qtrle.c

index bb55ba8a86aac100a664451792904fd12d2bb975..febfea30292309d902bd3229e7a8bd9767283b33 100644 (file)
@@ -346,7 +346,7 @@ static void qtrle_decode_24bpp(QtrleContext *s, int row_ptr, int lines_to_change
 
 static void qtrle_decode_32bpp(QtrleContext *s, int row_ptr, int lines_to_change)
 {
-    int rle_code;
+    int rle_code, rle_code_half;
     int pixel_ptr;
     int row_inc = s->frame->linesize[0];
     unsigned int argb;
@@ -379,10 +379,15 @@ static void qtrle_decode_32bpp(QtrleContext *s, int row_ptr, int lines_to_change
                 CHECK_PIXEL_PTR(rle_code * 4);
 
                 /* copy pixels directly to output */
-                while (rle_code--) {
-                    argb = bytestream2_get_ne32(&s->g);
-                    AV_WN32A(rgb + pixel_ptr, argb);
-                    pixel_ptr  += 4;
+                rle_code_half = rle_code / 2;
+                while (rle_code_half--) { /* copy 2 argb raw value at the same time */
+                    AV_WN64A(rgb + pixel_ptr, bytestream2_get_ne64(&s->g));
+                    pixel_ptr += 8;
+                }
+
+                if (rle_code % 2 != 0){ /* not even raw value */
+                    AV_WN32A(rgb + pixel_ptr, bytestream2_get_ne32(&s->g));
+                    pixel_ptr += 4;
                 }
             }
         }