Commit 5f7576b3 authored by reimar

Replace bytecopy with the equivalent but faster av_memcpy_backptr.

Ca. 10% faster xan_unpack on x86_64 decoding of SC_32-part.MVE


git-svn-id: file:///var/local/repositories/ffmpeg/trunk@18572 9553f0bf-9b14-0410-a0b8-cfaf0461ba5b
parent 5162e5b9
...@@ -35,6 +35,8 @@ ...@@ -35,6 +35,8 @@
#include "libavutil/intreadwrite.h" #include "libavutil/intreadwrite.h"
#include "avcodec.h" #include "avcodec.h"
// for av_memcpy_backptr
#include "libavutil/lzo.h"
typedef struct XanContext { typedef struct XanContext {
...@@ -76,26 +78,13 @@ static av_cold int xan_decode_init(AVCodecContext *avctx) ...@@ -76,26 +78,13 @@ static av_cold int xan_decode_init(AVCodecContext *avctx)
s->buffer1_size = avctx->width * avctx->height; s->buffer1_size = avctx->width * avctx->height;
s->buffer1 = av_malloc(s->buffer1_size); s->buffer1 = av_malloc(s->buffer1_size);
s->buffer2_size = avctx->width * avctx->height; s->buffer2_size = avctx->width * avctx->height;
s->buffer2 = av_malloc(s->buffer2_size); s->buffer2 = av_malloc(s->buffer2_size + 12);
if (!s->buffer1 || !s->buffer2) if (!s->buffer1 || !s->buffer2)
return -1; return -1;
return 0; return 0;
} }
/* Strictly forward, one-byte-at-a-time copy used where memcpy() is unsuitable.
 * The decoder routinely copies between overlapping regions and depends on
 * bytes being stored in ascending address order: with dest = src+1, for
 * example, a single byte A is replicated into the pattern AAAAAAAA.
 * This was originally repz movsb in Intel x86 ASM.
 *
 * dest  - first byte to write
 * src   - first byte to read (may overlap dest)
 * count - number of bytes to copy; nothing is copied when count <= 0 */
static inline void bytecopy(unsigned char *dest, const unsigned char *src, int count)
{
    /* Walk both pointers upwards so earlier writes are visible to later reads. */
    for (; count > 0; count--)
        *dest++ = *src++;
}
static int xan_huffman_decode(unsigned char *dest, const unsigned char *src, static int xan_huffman_decode(unsigned char *dest, const unsigned char *src,
int dest_len) int dest_len)
{ {
...@@ -130,6 +119,11 @@ static int xan_huffman_decode(unsigned char *dest, const unsigned char *src, ...@@ -130,6 +119,11 @@ static int xan_huffman_decode(unsigned char *dest, const unsigned char *src,
return 0; return 0;
} }
/**
* unpack simple compression
*
* @param dest destination buffer of dest_len, must be sufficiently padded for av_memcpy_backptr
*/
static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_len) static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_len)
{ {
unsigned char opcode; unsigned char opcode;
...@@ -153,7 +147,7 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l ...@@ -153,7 +147,7 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l
size = ((opcode & 0x1c) >> 2) + 3; size = ((opcode & 0x1c) >> 2) + 3;
if (dest + size > dest_end) if (dest + size > dest_end)
return; return;
bytecopy (dest, dest - (((opcode & 0x60) << 3) + offset + 1), size); av_memcpy_backptr(dest, ((opcode & 0x60) << 3) + offset + 1, size);
dest += size; dest += size;
} else if ( (opcode & 0x40) == 0 ) { } else if ( (opcode & 0x40) == 0 ) {
...@@ -169,7 +163,7 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l ...@@ -169,7 +163,7 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l
size = (opcode & 0x3f) + 4; size = (opcode & 0x3f) + 4;
if (dest + size > dest_end) if (dest + size > dest_end)
return; return;
bytecopy (dest, dest - (((byte1 & 0x3f) << 8) + byte2 + 1), size); av_memcpy_backptr(dest, ((byte1 & 0x3f) << 8) + byte2 + 1, size);
dest += size; dest += size;
} else if ( (opcode & 0x20) == 0 ) { } else if ( (opcode & 0x20) == 0 ) {
...@@ -186,8 +180,8 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l ...@@ -186,8 +180,8 @@ static void xan_unpack(unsigned char *dest, const unsigned char *src, int dest_l
size = byte3 + 5 + ((opcode & 0xc) << 6); size = byte3 + 5 + ((opcode & 0xc) << 6);
if (dest + size > dest_end) if (dest + size > dest_end)
return; return;
bytecopy (dest, av_memcpy_backptr(dest,
dest - ((((opcode & 0x10) >> 4) << 0x10) + 1 + (byte1 << 8) + byte2), (((opcode & 0x10) >> 4) << 0x10) + 1 + (byte1 << 8) + byte2,
size); size);
dest += size; dest += size;
} else { } else {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment