#include "asm.h"
static void get_pixels_mvi(int16_t *restrict block,
- const uint8_t *restrict pixels, ptrdiff_t line_size)
+ const uint8_t *restrict pixels, ptrdiff_t stride)
{
int h = 8;
stq(unpkbw(p), block);
stq(unpkbw(p >> 32), block + 4);
- pixels += line_size;
+ pixels += stride;
block += 8;
} while (--h);
}
static void diff_pixels_mvi(int16_t *block, const uint8_t *s1, const uint8_t *s2,
- int stride) {
+ ptrdiff_t stride)
+{
int h = 8;
uint64_t mask = 0x4040;
#include "libavcodec/avcodec.h"
#include "libavcodec/pixblockdsp.h"
/* Prototypes for the ARMv6 get_pixels / diff_pixels routines; their
 * definitions are not visible in this hunk.
 * This change re-wraps the get_pixels prototype and widens the stride
 * parameter of diff_pixels from int to ptrdiff_t, so both now take a
 * ptrdiff_t stride. */
-void ff_get_pixels_armv6(int16_t *block, const uint8_t *pixels, ptrdiff_t stride);
+void ff_get_pixels_armv6(int16_t *block, const uint8_t *pixels,
+ ptrdiff_t stride);
void ff_diff_pixels_armv6(int16_t *block, const uint8_t *s1,
- const uint8_t *s2, int stride);
+ const uint8_t *s2, ptrdiff_t stride);
av_cold void ff_pixblockdsp_init_arm(PixblockDSPContext *c,
AVCodecContext *avctx,
uint8_t dv_zigzag[2][64];
- void (*get_pixels)(int16_t *block, const uint8_t *pixels, ptrdiff_t line_size);
+ void (*get_pixels)(int16_t *block, const uint8_t *pixels, ptrdiff_t linesize);
void (*fdct[2])(int16_t *block);
void (*idct_put[2])(uint8_t *dest, int line_size, int16_t *block);
me_cmp_func ildct_cmp;
}
static av_always_inline int dv_guess_dct_mode(DVVideoContext *s, uint8_t *data,
- int linesize)
+ ptrdiff_t linesize)
{
if (s->avctx->flags & AV_CODEC_FLAG_INTERLACED_DCT) {
int ps = s->ildct_cmp(NULL, data, NULL, linesize, 8) - 400;
};
static av_always_inline int dv_init_enc_block(EncBlockInfo *bi, uint8_t *data,
- int linesize, DVVideoContext *s,
- int bias)
+ ptrdiff_t linesize,
+ DVVideoContext *s, int bias)
{
const int *weight;
const uint8_t *zigzag_scan;
DVVideoContext *s = avctx->priv_data;
DVwork_chunk *work_chunk = arg;
int mb_index, i, j;
- int mb_x, mb_y, c_offset, linesize, y_stride;
+ int mb_x, mb_y, c_offset;
+ ptrdiff_t linesize, y_stride;
uint8_t *y_ptr;
uint8_t *dif;
LOCAL_ALIGNED_8(uint8_t, scratch, [128]);
#include "../mpegvideo.h"
/* MSA variants. diff_pixels has its stride widened from int to ptrdiff_t;
 * the two get_pixels prototypes already took ptrdiff_t and are unchanged. */
void ff_diff_pixels_msa(int16_t *av_restrict block, const uint8_t *src1,
- const uint8_t *src2, int stride);
+ const uint8_t *src2, ptrdiff_t stride);
void ff_get_pixels_16_msa(int16_t *restrict dst, const uint8_t *src,
ptrdiff_t stride);
void ff_get_pixels_8_msa(int16_t *restrict dst, const uint8_t *src,
ptrdiff_t stride);
/* MMI variants. get_pixels only has its last parameter renamed
 * (line_size -> stride); diff_pixels has its stride widened from int to
 * ptrdiff_t. */
void ff_get_pixels_8_mmi(int16_t *av_restrict block, const uint8_t *pixels,
- ptrdiff_t line_size);
+ ptrdiff_t stride);
void ff_diff_pixels_mmi(int16_t *av_restrict block, const uint8_t *src1,
- const uint8_t *src2, int stride);
+ const uint8_t *src2, ptrdiff_t stride);
#endif // #ifndef AVCODEC_MIPS_PIXBLOCKDSP_MIPS_H
#include "libavutil/mips/mmiutils.h"
void ff_get_pixels_8_mmi(int16_t *av_restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
double ftmp[7];
DECLARE_VAR_ALL64;
"xor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
MMI_LDC1(%[ftmp1], %[pixels], 0x00)
- MMI_LDXC1(%[ftmp2], %[pixels], %[line_size], 0x00)
+ MMI_LDXC1(%[ftmp2], %[pixels], %[stride], 0x00)
"punpcklbh %[ftmp3], %[ftmp1], %[ftmp0] \n\t"
"punpckhbh %[ftmp4], %[ftmp1], %[ftmp0] \n\t"
"punpcklbh %[ftmp5], %[ftmp2], %[ftmp0] \n\t"
MMI_SDC1(%[ftmp4], %[block], 0x08)
MMI_SDC1(%[ftmp5], %[block], 0x10)
MMI_SDC1(%[ftmp6], %[block], 0x18)
- PTR_ADDU "%[pixels], %[pixels], %[line_size_x2] \n\t"
+ PTR_ADDU "%[pixels], %[pixels], %[stride_x2] \n\t"
MMI_LDC1(%[ftmp1], %[pixels], 0x00)
- MMI_LDXC1(%[ftmp2], %[pixels], %[line_size], 0x00)
+ MMI_LDXC1(%[ftmp2], %[pixels], %[stride], 0x00)
"punpcklbh %[ftmp3], %[ftmp1], %[ftmp0] \n\t"
"punpckhbh %[ftmp4], %[ftmp1], %[ftmp0] \n\t"
"punpcklbh %[ftmp5], %[ftmp2], %[ftmp0] \n\t"
MMI_SDC1(%[ftmp4], %[block], 0x28)
MMI_SDC1(%[ftmp5], %[block], 0x30)
MMI_SDC1(%[ftmp6], %[block], 0x38)
- PTR_ADDU "%[pixels], %[pixels], %[line_size_x2] \n\t"
+ PTR_ADDU "%[pixels], %[pixels], %[stride_x2] \n\t"
MMI_LDC1(%[ftmp1], %[pixels], 0x00)
- MMI_LDXC1(%[ftmp2], %[pixels], %[line_size], 0x00)
+ MMI_LDXC1(%[ftmp2], %[pixels], %[stride], 0x00)
"punpcklbh %[ftmp3], %[ftmp1], %[ftmp0] \n\t"
"punpckhbh %[ftmp4], %[ftmp1], %[ftmp0] \n\t"
"punpcklbh %[ftmp5], %[ftmp2], %[ftmp0] \n\t"
MMI_SDC1(%[ftmp4], %[block], 0x48)
MMI_SDC1(%[ftmp5], %[block], 0x50)
MMI_SDC1(%[ftmp6], %[block], 0x58)
- PTR_ADDU "%[pixels], %[pixels], %[line_size_x2] \n\t"
+ PTR_ADDU "%[pixels], %[pixels], %[stride_x2] \n\t"
MMI_LDC1(%[ftmp1], %[pixels], 0x00)
- MMI_LDXC1(%[ftmp2], %[pixels], %[line_size], 0x00)
+ MMI_LDXC1(%[ftmp2], %[pixels], %[stride], 0x00)
"punpcklbh %[ftmp3], %[ftmp1], %[ftmp0] \n\t"
"punpckhbh %[ftmp4], %[ftmp1], %[ftmp0] \n\t"
"punpcklbh %[ftmp5], %[ftmp2], %[ftmp0] \n\t"
RESTRICT_ASM_ALL64
RESTRICT_ASM_ADDRT
[pixels]"+&r"(pixels)
- : [block]"r"((mips_reg)block), [line_size]"r"((mips_reg)line_size),
- [line_size_x2]"r"((mips_reg)(line_size<<1))
+ : [block]"r"((mips_reg)block), [stride]"r"((mips_reg)stride),
+ [stride_x2]"r"((mips_reg)(stride<<1))
: "memory"
);
}
void ff_diff_pixels_mmi(int16_t *av_restrict block, const uint8_t *src1,
- const uint8_t *src2, int stride)
+ const uint8_t *src2, ptrdiff_t stride)
{
double ftmp[5];
mips_reg tmp[1];
}
/* Public MSA entry point for diff_pixels: forwards all four arguments,
 * unchanged, to diff_pixels_msa() (defined outside this hunk).
 * This change widens the stride parameter from int to ptrdiff_t.
 * NOTE(review): confirm diff_pixels_msa() itself accepts a ptrdiff_t
 * stride, otherwise the value is narrowed again at the call below. */
void ff_diff_pixels_msa(int16_t *av_restrict block, const uint8_t *src1,
- const uint8_t *src2, int stride)
+ const uint8_t *src2, ptrdiff_t stride)
{
diff_pixels_msa(block, src1, src2, stride);
}
#include "pixblockdsp.h"
/* Copies eight rows from pixels into block using AV_COPY128U, one call
 * per row. For row i the destination is block + i * 8 (eight int16_t
 * elements per row) and the source is pixels + i * stride, so stride is
 * the byte distance between consecutive source rows.
 * AV_COPY128U is defined elsewhere; presumably a 128-bit unaligned copy,
 * going by its name -- TODO confirm.
 * This change only renames the last parameter (line_size -> stride); the
 * type was already ptrdiff_t. */
static void get_pixels_16_c(int16_t *av_restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
- AV_COPY128U(block + 0 * 8, pixels + 0 * line_size);
- AV_COPY128U(block + 1 * 8, pixels + 1 * line_size);
- AV_COPY128U(block + 2 * 8, pixels + 2 * line_size);
- AV_COPY128U(block + 3 * 8, pixels + 3 * line_size);
- AV_COPY128U(block + 4 * 8, pixels + 4 * line_size);
- AV_COPY128U(block + 5 * 8, pixels + 5 * line_size);
- AV_COPY128U(block + 6 * 8, pixels + 6 * line_size);
- AV_COPY128U(block + 7 * 8, pixels + 7 * line_size);
+ AV_COPY128U(block + 0 * 8, pixels + 0 * stride);
+ AV_COPY128U(block + 1 * 8, pixels + 1 * stride);
+ AV_COPY128U(block + 2 * 8, pixels + 2 * stride);
+ AV_COPY128U(block + 3 * 8, pixels + 3 * stride);
+ AV_COPY128U(block + 4 * 8, pixels + 4 * stride);
+ AV_COPY128U(block + 5 * 8, pixels + 5 * stride);
+ AV_COPY128U(block + 6 * 8, pixels + 6 * stride);
+ AV_COPY128U(block + 7 * 8, pixels + 7 * stride);
}
static void get_pixels_8_c(int16_t *av_restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
int i;
block[5] = pixels[5];
block[6] = pixels[6];
block[7] = pixels[7];
- pixels += line_size;
+ pixels += stride;
block += 8;
}
}
static void diff_pixels_c(int16_t *av_restrict block, const uint8_t *s1,
- const uint8_t *s2, int stride)
+ const uint8_t *s2, ptrdiff_t stride)
{
int i;
/* Table of function pointers for the two pixel-block operations,
 * get_pixels and diff_pixels. Alignment expectations for the pointer
 * arguments are given in the inline comments on each parameter.
 * This change renames the last parameter of get_pixels
 * (line_size -> stride) and widens the stride of diff_pixels from int to
 * ptrdiff_t, so every implementation assigned to these pointers must use
 * the ptrdiff_t signature. */
typedef struct PixblockDSPContext {
void (*get_pixels)(int16_t *block /* align 16 */,
const uint8_t *pixels /* align 8 */,
- ptrdiff_t line_size);
+ ptrdiff_t stride);
void (*diff_pixels)(int16_t *block /* align 16 */,
const uint8_t *s1 /* align 8 */,
const uint8_t *s2 /* align 8 */,
- int stride);
+ ptrdiff_t stride);
} PixblockDSPContext;
void ff_pixblockdsp_init(PixblockDSPContext *c, AVCodecContext *avctx);
#if HAVE_VSX
static void get_pixels_altivec(int16_t *restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
int i;
vector unsigned char perm =
// Save the data to the block, we assume the block is 16-byte aligned.
vec_vsx_st(shorts, i * 16, (vector signed short *) block);
- pixels += line_size;
+ pixels += stride;
}
}
#else
static void get_pixels_altivec(int16_t *restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
int i;
const vec_u8 zero = (const vec_u8)vec_splat_u8(0);
// Save the data to the block, we assume the block is 16-byte aligned.
vec_st(shorts, i * 16, (vec_s16 *)block);
- pixels += line_size;
+ pixels += stride;
}
}
#if HAVE_VSX
static void diff_pixels_altivec(int16_t *restrict block, const uint8_t *s1,
- const uint8_t *s2, int stride)
+ const uint8_t *s2, ptrdiff_t stride)
{
int i;
const vector unsigned char zero =
}
#else
static void diff_pixels_altivec(int16_t *restrict block, const uint8_t *s1,
- const uint8_t *s2, int stride)
+ const uint8_t *s2, ptrdiff_t stride)
{
int i;
vec_u8 perm;
#if HAVE_VSX
static void get_pixels_vsx(int16_t *restrict block, const uint8_t *pixels,
- ptrdiff_t line_size)
+ ptrdiff_t stride)
{
int i;
for (i = 0; i < 8; i++) {
vec_vsx_st(shorts, i * 16, block);
- pixels += line_size;
+ pixels += stride;
}
}
static void diff_pixels_vsx(int16_t *restrict block, const uint8_t *s1,
- const uint8_t *s2, int stride)
+ const uint8_t *s2, ptrdiff_t stride)
{
int i;
vec_s16 shorts1, shorts2;
SECTION .text
INIT_MMX mmx
-; void ff_get_pixels_mmx(int16_t *block, const uint8_t *pixels, ptrdiff_t line_size)
+; void ff_get_pixels_mmx(int16_t *block, const uint8_t *pixels, ptrdiff_t stride)
cglobal get_pixels, 3,4
add r0, 128
mov r3, -128
RET
; void ff_diff_pixels_mmx(int16_t *block, const uint8_t *s1, const uint8_t *s2,
-; int stride);
+; ptrdiff_t stride);
%macro DIFF_PIXELS 0
cglobal diff_pixels, 4,5,5
- movsxdifnidn r3, r3d
pxor m4, m4
add r0, 128
mov r4, -128
#include "libavutil/x86/cpu.h"
#include "libavcodec/pixblockdsp.h"
/* Prototypes for the x86 MMX/SSE2 get_pixels and diff_pixels routines;
 * their definitions are not in this hunk.
 * The get_pixels prototypes only have their last parameter renamed
 * (line_size -> stride). The diff_pixels prototypes have stride widened
 * from int to ptrdiff_t. */
-void ff_get_pixels_mmx(int16_t *block, const uint8_t *pixels, ptrdiff_t line_size);
-void ff_get_pixels_sse2(int16_t *block, const uint8_t *pixels, ptrdiff_t line_size);
+void ff_get_pixels_mmx(int16_t *block, const uint8_t *pixels, ptrdiff_t stride);
+void ff_get_pixels_sse2(int16_t *block, const uint8_t *pixels, ptrdiff_t stride);
void ff_diff_pixels_mmx(int16_t *block, const uint8_t *s1, const uint8_t *s2,
- int stride);
+ ptrdiff_t stride);
void ff_diff_pixels_sse2(int16_t *block, const uint8_t *s1, const uint8_t *s2,
- int stride);
+ ptrdiff_t stride);
av_cold void ff_pixblockdsp_init_x86(PixblockDSPContext *c,
AVCodecContext *avctx,
#define check_diff_pixels(type) \
do { \
int i; \
- declare_func_emms(AV_CPU_FLAG_MMX, void, int16_t *av_restrict block, const uint8_t *s1, const uint8_t *s2, int stride); \
+ declare_func_emms(AV_CPU_FLAG_MMX, void, int16_t *av_restrict block, const uint8_t *s1, const uint8_t *s2, ptrdiff_t stride); \
\
for (i = 0; i < BUF_UNITS; i++) { \
int src_offset = i * 64 * sizeof(type) + 8 * i; /* Test various alignments */ \