[FFmpeg-devel] [PATCH] sgidec: make compiler optimize away memcpy call in inner loop.
Reimar Döffinger
Reimar.Doeffinger at gmx.de
Sun Jan 8 12:21:25 CET 2012
Using an always_inline function makes the memcpy length a constant,
any reasonable compiler will replace it by a single mov instruction
without us having to duplicate the actual code.
Signed-off-by: Reimar Döffinger <Reimar.Doeffinger at gmx.de>
---
libavcodec/sgidec.c | 38 +++++++++++++++++++++++++-------------
1 files changed, 25 insertions(+), 13 deletions(-)
diff --git a/libavcodec/sgidec.c b/libavcodec/sgidec.c
index ae05d83..98327a8 100644
--- a/libavcodec/sgidec.c
+++ b/libavcodec/sgidec.c
@@ -20,6 +20,7 @@
*/
#include "libavutil/imgutils.h"
+#include "libavutil/avassert.h"
#include "avcodec.h"
#include "bytestream.h"
#include "sgi.h"
@@ -113,6 +114,25 @@ static int read_rle_sgi(unsigned char* out_buf, const uint8_t *in_buf,
return 0;
}
+static av_always_inline void copy_loop(uint8_t *out_buf, const uint8_t *in_buf,
+ unsigned offset, unsigned bytes_per_channel,
+ SgiState *s)
+{
+ int x, y, z;
+ for (y = s->height - 1; y >= 0; y--) {
+ uint8_t *line = out_buf + (y * s->linesize);
+ for (x = s->width; x > 0; x--) {
+ const uint8_t *ptr = in_buf;
+ in_buf += bytes_per_channel;
+ for(z = 0; z < s->depth; z ++) {
+ memcpy(line, ptr, bytes_per_channel);
+ line += bytes_per_channel;
+ ptr += offset;
+ }
+ }
+ }
+}
+
/**
* Read an uncompressed SGI image.
* @param out_buf output buffer
@@ -125,8 +145,6 @@ static int read_rle_sgi(unsigned char* out_buf, const uint8_t *in_buf,
static int read_uncompressed_sgi(unsigned char* out_buf, uint8_t* out_end,
const uint8_t *in_buf, const uint8_t *in_end, SgiState* s)
{
- int x, y, z;
- const uint8_t *ptr;
unsigned int offset = s->height * s->width * s->bytes_per_channel;
/* Test buffer size. */
@@ -134,17 +152,11 @@ static int read_uncompressed_sgi(unsigned char* out_buf, uint8_t* out_end,
return -1;
}
- for (y = s->height - 1; y >= 0; y--) {
- out_end = out_buf + (y * s->linesize);
- for (x = s->width; x > 0; x--) {
- ptr = in_buf;
- in_buf += s->bytes_per_channel;
- for(z = 0; z < s->depth; z ++) {
- memcpy(out_end, ptr, s->bytes_per_channel);
- out_end += s->bytes_per_channel;
- ptr += offset;
- }
- }
+ if (s->bytes_per_channel == 2) {
+ copy_loop(out_buf, in_buf, offset, 2, s);
+ } else {
+ av_assert1(s->bytes_per_channel == 1);
+ copy_loop(out_buf, in_buf, offset, 1, s);
}
return 0;
}
--
1.7.8.3
More information about the ffmpeg-devel
mailing list