[FFmpeg-cvslog] lavu/ripemd: Add a size optimized version of the transform functions

James Almer git at videolan.org
Mon Sep 9 11:40:28 CEST 2013


ffmpeg | branch: master | James Almer <jamrial at gmail.com> | Mon Sep  9 05:42:22 2013 -0300| [8702a94e49922880f5d5b89ce41a0a776c0f9561] | committer: Michael Niedermayer

lavu/ripemd: Add a size optimized version of the transform functions

When compiling with --enable-small, ripemd.o will be a few kilobytes smaller
than it was before the previous commit.

Signed-off-by: James Almer <jamrial at gmail.com>
Signed-off-by: Michael Niedermayer <michaelni at gmx.at>

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=8702a94e49922880f5d5b89ce41a0a776c0f9561
---

 libavutil/ripemd.c |   75 +++++++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 72 insertions(+), 3 deletions(-)

diff --git a/libavutil/ripemd.c b/libavutil/ripemd.c
index 37b42df..1ceb24b 100644
--- a/libavutil/ripemd.c
+++ b/libavutil/ripemd.c
@@ -88,7 +88,7 @@ static const int WB[80] = {
 
 #define rol(value, bits) ((value << bits) | (value >> (32 - bits)))
 
-#define SWAP(a,b) if (ext) { int t = a; a = b; b = t; }
+#define SWAP(a,b) if (ext) { t = a; a = b; b = t; }
 
 #define ROUND128_0_TO_15(a,b,c,d,e,f,g,h)                               \
     a = rol(a + ((  b ^ c  ^ d)      + block[WA[n]]),         ROTA[n]); \
@@ -112,7 +112,7 @@ static const int WB[80] = {
 
 static void ripemd128_transform(uint32_t *state, const uint8_t buffer[64], int ext)
 {
-    uint32_t a, b, c, d, e, f, g, h;
+    uint32_t a, b, c, d, e, f, g, h, t;
     uint32_t block[16];
     int n;
 
@@ -130,6 +130,36 @@ static void ripemd128_transform(uint32_t *state, const uint8_t buffer[64], int e
         block[n] = AV_RL32(buffer + 4 * n);
     n = 0;
 
+#if CONFIG_SMALL
+    for (; n < 16;) {
+        ROUND128_0_TO_15(a,b,c,d,e,f,g,h);
+        t = d; d = c; c = b; b = a; a = t;
+        t = h; h = g; g = f; f = e; e = t;
+    }
+    SWAP(a,e)
+
+    for (; n < 32;) {
+        ROUND128_16_TO_31(a,b,c,d,e,f,g,h);
+        t = d; d = c; c = b; b = a; a = t;
+        t = h; h = g; g = f; f = e; e = t;
+    }
+    SWAP(b,f)
+
+    for (; n < 48;) {
+        ROUND128_32_TO_47(a,b,c,d,e,f,g,h);
+        t = d; d = c; c = b; b = a; a = t;
+        t = h; h = g; g = f; f = e; e = t;
+    }
+    SWAP(c,g)
+
+    for (; n < 64;) {
+        ROUND128_48_TO_63(a,b,c,d,e,f,g,h);
+        t = d; d = c; c = b; b = a; a = t;
+        t = h; h = g; g = f; f = e; e = t;
+    }
+    SWAP(d,h)
+#else
+
 #define R128_0                         \
     ROUND128_0_TO_15(a,b,c,d,e,f,g,h); \
     ROUND128_0_TO_15(d,a,b,c,h,e,f,g); \
@@ -165,6 +195,7 @@ static void ripemd128_transform(uint32_t *state, const uint8_t buffer[64], int e
 
     R128_48; R128_48; R128_48; R128_48;
     SWAP(d,h)
+#endif
 
     if (ext) {
         state[0] += a; state[1] += b; state[2] += c; state[3] += d;
@@ -210,7 +241,7 @@ static void ripemd128_transform(uint32_t *state, const uint8_t buffer[64], int e
 
 static void ripemd160_transform(uint32_t *state, const uint8_t buffer[64], int ext)
 {
-    uint32_t a, b, c, d, e, f, g, h, i, j;
+    uint32_t a, b, c, d, e, f, g, h, i, j, t;
     uint32_t block[16];
     int n;
 
@@ -229,6 +260,43 @@ static void ripemd160_transform(uint32_t *state, const uint8_t buffer[64], int e
         block[n] = AV_RL32(buffer + 4 * n);
     n = 0;
 
+#if CONFIG_SMALL
+    for (; n < 16;) {
+        ROUND160_0_TO_15(a,b,c,d,e,f,g,h,i,j);
+        t = e; e = d; d = c; c = b; b = a; a = t;
+        t = j; j = i; i = h; h = g; g = f; f = t;
+    }
+    SWAP(b,g)
+
+    for (; n < 32;) {
+        ROUND160_16_TO_31(a,b,c,d,e,f,g,h,i,j);
+        t = e; e = d; d = c; c = b; b = a; a = t;
+        t = j; j = i; i = h; h = g; g = f; f = t;
+    }
+    SWAP(d,i)
+
+    for (; n < 48;) {
+        ROUND160_32_TO_47(a,b,c,d,e,f,g,h,i,j);
+        t = e; e = d; d = c; c = b; b = a; a = t;
+        t = j; j = i; i = h; h = g; g = f; f = t;
+    }
+    SWAP(a,f)
+
+    for (; n < 64;) {
+        ROUND160_48_TO_63(a,b,c,d,e,f,g,h,i,j);
+        t = e; e = d; d = c; c = b; b = a; a = t;
+        t = j; j = i; i = h; h = g; g = f; f = t;
+    }
+    SWAP(c,h)
+
+    for (; n < 80;) {
+        ROUND160_64_TO_79(a,b,c,d,e,f,g,h,i,j);
+        t = e; e = d; d = c; c = b; b = a; a = t;
+        t = j; j = i; i = h; h = g; g = f; f = t;
+    }
+    SWAP(e,j)
+#else
+
 #define R160_0                             \
     ROUND160_0_TO_15(a,b,c,d,e,f,g,h,i,j); \
     ROUND160_0_TO_15(e,a,b,c,d,j,f,g,h,i); \
@@ -283,6 +351,7 @@ static void ripemd160_transform(uint32_t *state, const uint8_t buffer[64], int e
     R160_64; R160_64; R160_64;
     ROUND160_64_TO_79(b,c,d,e,a,g,h,i,j,f);
     SWAP(e,j)
+#endif
 
     if (ext) {
         state[0] += a; state[1] += b; state[2] += c; state[3] += d; state[4] += e;



More information about the ffmpeg-cvslog mailing list