[FFmpeg-cvslog] r16202 - trunk/libavcodec/h264pred.c

lorenm subversion
Thu Dec 18 02:05:07 CET 2008


Author: lorenm
Date: Thu Dec 18 02:05:06 2008
New Revision: 16202

Log:
1.6x faster pred*_vertical_add_c


Modified:
   trunk/libavcodec/h264pred.c

Modified: trunk/libavcodec/h264pred.c
==============================================================================
--- trunk/libavcodec/h264pred.c	(original)
+++ trunk/libavcodec/h264pred.c	Thu Dec 18 02:05:06 2008
@@ -989,23 +989,26 @@ static void pred8x8l_horizontal_up_c(uin
 
 static void pred4x4_vertical_add_c(uint8_t *pix, const DCTELEM *block, int stride){
     int i;
+    pix -= stride;
     for(i=0; i<4; i++){
-        pix[0]= pix[0-stride] + block[0];
-        pix[1]= pix[1-stride] + block[1];
-        pix[2]= pix[2-stride] + block[2];
-        pix[3]= pix[3-stride] + block[3];
-        pix+= stride;
-        block+= 4;
+        uint8_t v = pix[0];
+        pix[1*stride]= v += block[0];
+        pix[2*stride]= v += block[4];
+        pix[3*stride]= v += block[8];
+        pix[4*stride]= v += block[12];
+        pix++;
+        block++;
     }
 }
 
 static void pred4x4_horizontal_add_c(uint8_t *pix, const DCTELEM *block, int stride){
     int i;
     for(i=0; i<4; i++){
-        pix[0]= pix[-1] + block[0];
-        pix[1]= pix[ 0] + block[1];
-        pix[2]= pix[ 1] + block[2];
-        pix[3]= pix[ 2] + block[3];
+        uint8_t v = pix[-1];
+        pix[0]= v += block[0];
+        pix[1]= v += block[1];
+        pix[2]= v += block[2];
+        pix[3]= v += block[3];
         pix+= stride;
         block+= 4;
     }
@@ -1013,31 +1016,34 @@ static void pred4x4_horizontal_add_c(uin
 
 static void pred8x8l_vertical_add_c(uint8_t *pix, const DCTELEM *block, int stride){
     int i;
+    pix -= stride;
     for(i=0; i<8; i++){
-        pix[0]= pix[0-stride] + block[0];
-        pix[1]= pix[1-stride] + block[1];
-        pix[2]= pix[2-stride] + block[2];
-        pix[3]= pix[3-stride] + block[3];
-        pix[4]= pix[4-stride] + block[4];
-        pix[5]= pix[5-stride] + block[5];
-        pix[6]= pix[6-stride] + block[6];
-        pix[7]= pix[7-stride] + block[7];
-        pix+= stride;
-        block+= 8;
+        uint8_t v = pix[0];
+        pix[1*stride]= v += block[0];
+        pix[2*stride]= v += block[8];
+        pix[3*stride]= v += block[16];
+        pix[4*stride]= v += block[24];
+        pix[5*stride]= v += block[32];
+        pix[6*stride]= v += block[40];
+        pix[7*stride]= v += block[48];
+        pix[8*stride]= v += block[56];
+        pix++;
+        block++;
     }
 }
 
 static void pred8x8l_horizontal_add_c(uint8_t *pix, const DCTELEM *block, int stride){
     int i;
     for(i=0; i<8; i++){
-        pix[0]= pix[-1] + block[0];
-        pix[1]= pix[ 0] + block[1];
-        pix[2]= pix[ 1] + block[2];
-        pix[3]= pix[ 2] + block[3];
-        pix[4]= pix[ 3] + block[4];
-        pix[5]= pix[ 4] + block[5];
-        pix[6]= pix[ 5] + block[6];
-        pix[7]= pix[ 6] + block[7];
+        uint8_t v = pix[-1];
+        pix[0]= v += block[0];
+        pix[1]= v += block[1];
+        pix[2]= v += block[2];
+        pix[3]= v += block[3];
+        pix[4]= v += block[4];
+        pix[5]= v += block[5];
+        pix[6]= v += block[6];
+        pix[7]= v += block[7];
         pix+= stride;
         block+= 8;
     }




More information about the ffmpeg-cvslog mailing list