diff options
Diffstat (limited to 'libavcodec/h264pred_template.c')
-rw-r--r-- | libavcodec/h264pred_template.c | 289 |
1 files changed, 195 insertions, 94 deletions
diff --git a/libavcodec/h264pred_template.c b/libavcodec/h264pred_template.c index 3a1b1cf94e..f08fdf4ba4 100644 --- a/libavcodec/h264pred_template.c +++ b/libavcodec/h264pred_template.c @@ -29,7 +29,9 @@ #include "bit_depth_template.c" -static void FUNCC(pred4x4_vertical)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_vertical)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const pixel4 a= AV_RN4PA(src-stride); @@ -40,7 +42,9 @@ static void FUNCC(pred4x4_vertical)(uint8_t *_src, const uint8_t *topright, int AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_horizontal)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_horizontal)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); AV_WN4PA(src+0*stride, PIXEL_SPLAT_X4(src[-1+0*stride])); @@ -49,7 +53,9 @@ static void FUNCC(pred4x4_horizontal)(uint8_t *_src, const uint8_t *topright, in AV_WN4PA(src+3*stride, PIXEL_SPLAT_X4(src[-1+3*stride])); } -static void FUNCC(pred4x4_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int dc= ( src[-stride] + src[1-stride] + src[2-stride] + src[3-stride] @@ -62,7 +68,9 @@ static void FUNCC(pred4x4_dc)(uint8_t *_src, const uint8_t *topright, int _strid AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_left_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_left_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int dc= ( src[-1+0*stride] + src[-1+1*stride] + src[-1+2*stride] + src[-1+3*stride] + 2) >>2; @@ -74,7 +82,9 @@ static void FUNCC(pred4x4_left_dc)(uint8_t *_src, const uint8_t *topright, int _ AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_top_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_top_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int dc= ( src[-stride] + src[1-stride] + src[2-stride] + src[3-stride] + 2) >>2; @@ -86,7 +96,9 @@ static void FUNCC(pred4x4_top_dc)(uint8_t *_src, const uint8_t *topright, int _s AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_128_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_128_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const pixel4 a = PIXEL_SPLAT_X4(1<<(BIT_DEPTH-1)); @@ -97,7 +109,9 @@ static void FUNCC(pred4x4_128_dc)(uint8_t *_src, const uint8_t *topright, int _s AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_127_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_127_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const pixel4 a = PIXEL_SPLAT_X4((1<<(BIT_DEPTH-1))-1); @@ -108,7 +122,9 @@ static void FUNCC(pred4x4_127_dc)(uint8_t *_src, const uint8_t *topright, int _s AV_WN4PA(src+3*stride, a); } -static void FUNCC(pred4x4_129_dc)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_129_dc)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const pixel4 a = PIXEL_SPLAT_X4((1<<(BIT_DEPTH-1))+1); @@ -144,7 +160,9 @@ static void FUNCC(pred4x4_129_dc)(uint8_t *_src, const uint8_t *topright, int _s const unsigned av_unused t2 = src[ 2-1*stride];\ const unsigned av_unused t3 = src[ 3-1*stride];\ -static void FUNCC(pred4x4_down_right)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_down_right)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int lt= src[-1-1*stride]; @@ -169,7 +187,9 @@ static void FUNCC(pred4x4_down_right)(uint8_t *_src, const uint8_t *topright, in src[3+0*stride]=(t1 + 2*t2 + t3 + 2)>>2; } -static void FUNCC(pred4x4_down_left)(uint8_t *_src, const uint8_t *_topright, int _stride){ +static void FUNCC(pred4x4_down_left)(uint8_t *_src, const uint8_t *_topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; const pixel *topright = (const pixel*)_topright; int stride = _stride>>(sizeof(pixel)-1); @@ -195,7 +215,10 @@ static void FUNCC(pred4x4_down_left)(uint8_t *_src, const uint8_t *_topright, in src[3+3*stride]=(t6 + 3*t7 + 2)>>2; } -static void FUNCC(pred4x4_vertical_right)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_vertical_right)(uint8_t *_src, + const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int lt= src[-1-1*stride]; @@ -220,7 +243,10 @@ static void FUNCC(pred4x4_vertical_right)(uint8_t *_src, const uint8_t *topright src[0+3*stride]=(l0 + 2*l1 + l2 + 2)>>2; } -static void FUNCC(pred4x4_vertical_left)(uint8_t *_src, const uint8_t *_topright, int _stride){ +static void FUNCC(pred4x4_vertical_left)(uint8_t *_src, + const uint8_t *_topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; const pixel *topright = (const pixel*)_topright; int stride = _stride>>(sizeof(pixel)-1); @@ -245,7 +271,9 @@ static void FUNCC(pred4x4_vertical_left)(uint8_t *_src, const uint8_t *_topright src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2; } -static void FUNCC(pred4x4_horizontal_up)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_horizontal_up)(uint8_t *_src, const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); LOAD_LEFT_EDGE @@ -268,7 +296,10 @@ static void FUNCC(pred4x4_horizontal_up)(uint8_t *_src, const uint8_t *topright, src[3+3*stride]=l3; } -static void FUNCC(pred4x4_horizontal_down)(uint8_t *_src, const uint8_t *topright, int _stride){ +static void FUNCC(pred4x4_horizontal_down)(uint8_t *_src, + const uint8_t *topright, + ptrdiff_t _stride) +{ pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); const int lt= src[-1-1*stride]; @@ -293,7 +324,8 @@ static void FUNCC(pred4x4_horizontal_down)(uint8_t *_src, const uint8_t *toprigh src[1+3*stride]=(l1 + 2*l2 + l3 + 2)>>2; } -static void FUNCC(pred16x16_vertical)(uint8_t *_src, int _stride){ +static void FUNCC(pred16x16_vertical)(uint8_t *_src, ptrdiff_t _stride) +{ int i; pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); @@ -310,7 +342,8 @@ static void FUNCC(pred16x16_vertical)(uint8_t *_src, int _stride){ } } -static void FUNCC(pred16x16_horizontal)(uint8_t *_src, int stride){ +static void FUNCC(pred16x16_horizontal)(uint8_t *_src, ptrdiff_t stride) +{ int i; pixel *src = (pixel*)_src; stride >>= sizeof(pixel)-1; @@ -334,7 +367,8 @@ static void FUNCC(pred16x16_horizontal)(uint8_t *_src, int stride){ src += stride;\ } -static void FUNCC(pred16x16_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred16x16_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i, dc=0; pixel *src = (pixel*)_src; pixel4 dcsplat; @@ -352,7 +386,8 @@ static void FUNCC(pred16x16_dc)(uint8_t *_src, int stride){ PREDICT_16x16_DC(dcsplat); } -static void FUNCC(pred16x16_left_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred16x16_left_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i, dc=0; pixel *src = (pixel*)_src; pixel4 dcsplat; @@ -366,7 +401,8 @@ static void FUNCC(pred16x16_left_dc)(uint8_t *_src, int stride){ PREDICT_16x16_DC(dcsplat); } -static void FUNCC(pred16x16_top_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred16x16_top_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i, dc=0; pixel *src = (pixel*)_src; pixel4 dcsplat; @@ -381,7 +417,8 @@ static void FUNCC(pred16x16_top_dc)(uint8_t *_src, int stride){ } #define PRED16x16_X(n, v) \ -static void FUNCC(pred16x16_##n##_dc)(uint8_t *_src, int stride){\ +static void FUNCC(pred16x16_##n##_dc)(uint8_t *_src, ptrdiff_t stride)\ +{\ int i;\ pixel *src = (pixel*)_src;\ stride >>= sizeof(pixel)-1;\ @@ -392,12 +429,16 @@ PRED16x16_X(127, (1<<(BIT_DEPTH-1))-1) PRED16x16_X(128, (1<<(BIT_DEPTH-1))+0) PRED16x16_X(129, (1<<(BIT_DEPTH-1))+1) -static inline void FUNCC(pred16x16_plane_compat)(uint8_t *p_src, int p_stride, const int svq3, const int rv40){ +static inline void FUNCC(pred16x16_plane_compat)(uint8_t *_src, + ptrdiff_t _stride, + const int svq3, + const int rv40) +{ int i, j, k; int a; INIT_CLIP - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); const pixel * const src0 = src +7-stride; const pixel * src1 = src +8*stride-1; const pixel * src2 = src1-2*stride; // == src+6*stride-1; @@ -437,11 +478,13 @@ static inline void FUNCC(pred16x16_plane_compat)(uint8_t *p_src, int p_stride, c } } -static void FUNCC(pred16x16_plane)(uint8_t *src, int stride){ +static void FUNCC(pred16x16_plane)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred16x16_plane_compat)(src, stride, 0, 0); } -static void FUNCC(pred8x8_vertical)(uint8_t *_src, int _stride){ +static void FUNCC(pred8x8_vertical)(uint8_t *_src, ptrdiff_t _stride) +{ int i; pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); @@ -454,7 +497,8 @@ static void FUNCC(pred8x8_vertical)(uint8_t *_src, int _stride){ } } -static void FUNCC(pred8x16_vertical)(uint8_t *_src, int _stride){ +static void FUNCC(pred8x16_vertical)(uint8_t *_src, ptrdiff_t _stride) +{ int i; pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); @@ -467,7 +511,8 @@ static void FUNCC(pred8x16_vertical)(uint8_t *_src, int _stride){ } } -static void FUNCC(pred8x8_horizontal)(uint8_t *_src, int stride){ +static void FUNCC(pred8x8_horizontal)(uint8_t *_src, ptrdiff_t stride) +{ int i; pixel *src = (pixel*)_src; stride >>= sizeof(pixel)-1; @@ -479,7 +524,8 @@ static void FUNCC(pred8x8_horizontal)(uint8_t *_src, int stride){ } } -static void FUNCC(pred8x16_horizontal)(uint8_t *_src, int stride){ +static void FUNCC(pred8x16_horizontal)(uint8_t *_src, ptrdiff_t stride) +{ int i; pixel *src = (pixel*)_src; stride >>= sizeof(pixel)-1; @@ -491,7 +537,8 @@ static void FUNCC(pred8x16_horizontal)(uint8_t *_src, int stride){ } #define PRED8x8_X(n, v)\ -static void FUNCC(pred8x8_##n##_dc)(uint8_t *_src, int stride){\ +static void FUNCC(pred8x8_##n##_dc)(uint8_t *_src, ptrdiff_t stride)\ +{\ int i;\ const pixel4 a = PIXEL_SPLAT_X4(v);\ pixel *src = (pixel*)_src;\ @@ -506,12 +553,14 @@ PRED8x8_X(127, (1<<(BIT_DEPTH-1))-1) PRED8x8_X(128, (1<<(BIT_DEPTH-1))+0) PRED8x8_X(129, (1<<(BIT_DEPTH-1))+1) -static void FUNCC(pred8x16_128_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x16_128_dc)(uint8_t *_src, ptrdiff_t stride) +{ FUNCC(pred8x8_128_dc)(_src, stride); FUNCC(pred8x8_128_dc)(_src+8*stride, stride); } -static void FUNCC(pred8x8_left_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x8_left_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i; int dc0, dc2; pixel4 dc0splat, dc2splat; @@ -536,12 +585,14 @@ static void FUNCC(pred8x8_left_dc)(uint8_t *_src, int stride){ } } -static void FUNCC(pred8x16_left_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x16_left_dc)(uint8_t *_src, ptrdiff_t stride) +{ FUNCC(pred8x8_left_dc)(_src, stride); FUNCC(pred8x8_left_dc)(_src+8*stride, stride); } -static void FUNCC(pred8x8_top_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x8_top_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i; int dc0, dc1; pixel4 dc0splat, dc1splat; @@ -566,7 +617,8 @@ static void FUNCC(pred8x8_top_dc)(uint8_t *_src, int stride){ } } -static void FUNCC(pred8x16_top_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x16_top_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i; int dc0, dc1; pixel4 dc0splat, dc1splat; @@ -587,7 +639,8 @@ static void FUNCC(pred8x16_top_dc)(uint8_t *_src, int stride){ } } -static void FUNCC(pred8x8_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x8_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i; int dc0, dc1, dc2; pixel4 dc0splat, dc1splat, dc2splat, dc3splat; @@ -615,7 +668,8 @@ static void FUNCC(pred8x8_dc)(uint8_t *_src, int stride){ } } -static void FUNCC(pred8x16_dc)(uint8_t *_src, int stride){ +static void FUNCC(pred8x16_dc)(uint8_t *_src, ptrdiff_t stride) +{ int i; int dc0, dc1, dc2, dc3, dc4; pixel4 dc0splat, dc1splat, dc2splat, dc3splat, dc4splat, dc5splat, dc6splat, dc7splat; @@ -658,51 +712,60 @@ static void FUNCC(pred8x16_dc)(uint8_t *_src, int stride){ } //the following 4 function should not be optimized! -static void FUNC(pred8x8_mad_cow_dc_l0t)(uint8_t *src, int stride){ +static void FUNC(pred8x8_mad_cow_dc_l0t)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x8_top_dc)(src, stride); FUNCC(pred4x4_dc)(src, NULL, stride); } -static void FUNC(pred8x16_mad_cow_dc_l0t)(uint8_t *src, int stride){ +static void FUNC(pred8x16_mad_cow_dc_l0t)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x16_top_dc)(src, stride); FUNCC(pred4x4_dc)(src, NULL, stride); } -static void FUNC(pred8x8_mad_cow_dc_0lt)(uint8_t *src, int stride){ +static void FUNC(pred8x8_mad_cow_dc_0lt)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x8_dc)(src, stride); FUNCC(pred4x4_top_dc)(src, NULL, stride); } -static void FUNC(pred8x16_mad_cow_dc_0lt)(uint8_t *src, int stride){ +static void FUNC(pred8x16_mad_cow_dc_0lt)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x16_dc)(src, stride); FUNCC(pred4x4_top_dc)(src, NULL, stride); } -static void FUNC(pred8x8_mad_cow_dc_l00)(uint8_t *src, int stride){ +static void FUNC(pred8x8_mad_cow_dc_l00)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x8_left_dc)(src, stride); FUNCC(pred4x4_128_dc)(src + 4*stride , NULL, stride); FUNCC(pred4x4_128_dc)(src + 4*stride + 4*sizeof(pixel), NULL, stride); } -static void FUNC(pred8x16_mad_cow_dc_l00)(uint8_t *src, int stride){ +static void FUNC(pred8x16_mad_cow_dc_l00)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x16_left_dc)(src, stride); FUNCC(pred4x4_128_dc)(src + 4*stride , NULL, stride); FUNCC(pred4x4_128_dc)(src + 4*stride + 4*sizeof(pixel), NULL, stride); } -static void FUNC(pred8x8_mad_cow_dc_0l0)(uint8_t *src, int stride){ +static void FUNC(pred8x8_mad_cow_dc_0l0)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x8_left_dc)(src, stride); FUNCC(pred4x4_128_dc)(src , NULL, stride); FUNCC(pred4x4_128_dc)(src + 4*sizeof(pixel), NULL, stride); } -static void FUNC(pred8x16_mad_cow_dc_0l0)(uint8_t *src, int stride){ +static void FUNC(pred8x16_mad_cow_dc_0l0)(uint8_t *src, ptrdiff_t stride) +{ FUNCC(pred8x16_left_dc)(src, stride); FUNCC(pred4x4_128_dc)(src , NULL, stride); FUNCC(pred4x4_128_dc)(src + 4*sizeof(pixel), NULL, stride); } -static void FUNCC(pred8x8_plane)(uint8_t *_src, int _stride){ +static void FUNCC(pred8x8_plane)(uint8_t *_src, ptrdiff_t _stride) +{ int j, k; int a; INIT_CLIP @@ -737,7 +800,8 @@ static void FUNCC(pred8x8_plane)(uint8_t *_src, int _stride){ } } -static void FUNCC(pred8x16_plane)(uint8_t *_src, int _stride){ +static void FUNCC(pred8x16_plane)(uint8_t *_src, ptrdiff_t _stride) +{ int j, k; int a; INIT_CLIP @@ -816,14 +880,16 @@ static void FUNCC(pred8x16_plane)(uint8_t *_src, int _stride){ src += stride; \ } -static void FUNCC(pred8x8l_128_dc)(uint8_t *_src, int has_topleft, int has_topright, int _stride) +static void FUNCC(pred8x8l_128_dc)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_DC(PIXEL_SPLAT_X4(1<<(BIT_DEPTH-1))); } -static void FUNCC(pred8x8l_left_dc)(uint8_t *_src, int has_topleft, int has_topright, int _stride) +static void FUNCC(pred8x8l_left_dc)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { pixel *src = (pixel*)_src; int stride = _stride>>(sizeof(pixel)-1); @@ -832,19 +898,21 @@ static void FUNCC(pred8x8l_left_dc)(uint8_t *_src, int has_topleft, int has_topr const pixel4 dc = PIXEL_SPLAT_X4((l0+l1+l2+l3+l4+l5+l6+l7+4) >> 3); PREDICT_8x8_DC(dc); } -static void FUNCC(pred8x8l_top_dc)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_top_dc)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; const pixel4 dc = PIXEL_SPLAT_X4((t0+t1+t2+t3+t4+t5+t6+t7+4) >> 3); PREDICT_8x8_DC(dc); } -static void FUNCC(pred8x8l_dc)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_dc)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_LEFT; PREDICT_8x8_LOAD_TOP; @@ -852,10 +920,11 @@ static void FUNCC(pred8x8l_dc)(uint8_t *p_src, int has_topleft, int has_topright +t0+t1+t2+t3+t4+t5+t6+t7+8) >> 4); PREDICT_8x8_DC(dc); } -static void FUNCC(pred8x8l_horizontal)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_horizontal)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); pixel4 a; PREDICT_8x8_LOAD_LEFT; @@ -865,7 +934,8 @@ static void FUNCC(pred8x8l_horizontal)(uint8_t *p_src, int has_topleft, int has_ ROW(0); ROW(1); ROW(2); ROW(3); ROW(4); ROW(5); ROW(6); ROW(7); #undef ROW } -static void FUNCC(pred8x8l_vertical)(uint8_t *_src, int has_topleft, int has_topright, int _stride) +static void FUNCC(pred8x8l_vertical)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { int y; pixel *src = (pixel*)_src; @@ -888,10 +958,11 @@ static void FUNCC(pred8x8l_vertical)(uint8_t *_src, int has_topleft, int has_top AV_WN4PA(((pixel4*)(src+y*stride))+1, b); } } -static void FUNCC(pred8x8l_down_left)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_down_left)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; PREDICT_8x8_LOAD_TOPRIGHT; SRC(0,0)= (t0 + 2*t1 + t2 + 2) >> 2; @@ -910,10 +981,11 @@ static void FUNCC(pred8x8l_down_left)(uint8_t *p_src, int has_topleft, int has_t SRC(6,7)=SRC(7,6)= (t13 + 2*t14 + t15 + 2) >> 2; SRC(7,7)= (t14 + 3*t15 + 2) >> 2; } -static void FUNCC(pred8x8l_down_right)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_down_right)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; PREDICT_8x8_LOAD_LEFT; PREDICT_8x8_LOAD_TOPLEFT; @@ -933,10 +1005,11 @@ static void FUNCC(pred8x8l_down_right)(uint8_t *p_src, int has_topleft, int has_ SRC(6,0)=SRC(7,1)= (t4 + 2*t5 + t6 + 2) >> 2; SRC(7,0)= (t5 + 2*t6 + t7 + 2) >> 2; } -static void FUNCC(pred8x8l_vertical_right)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_vertical_right)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; PREDICT_8x8_LOAD_LEFT; PREDICT_8x8_LOAD_TOPLEFT; @@ -963,10 +1036,11 @@ static void FUNCC(pred8x8l_vertical_right)(uint8_t *p_src, int has_topleft, int SRC(7,1)= (t5 + 2*t6 + t7 + 2) >> 2; SRC(7,0)= (t6 + t7 + 1) >> 1; } -static void FUNCC(pred8x8l_horizontal_down)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_horizontal_down)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; PREDICT_8x8_LOAD_LEFT; PREDICT_8x8_LOAD_TOPLEFT; @@ -993,10 +1067,11 @@ static void FUNCC(pred8x8l_horizontal_down)(uint8_t *p_src, int has_topleft, int SRC(6,0)= (t5 + 2*t4 + t3 + 2) >> 2; SRC(7,0)= (t6 + 2*t5 + t4 + 2) >> 2; } -static void FUNCC(pred8x8l_vertical_left)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_vertical_left)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_TOP; PREDICT_8x8_LOAD_TOPRIGHT; SRC(0,0)= (t0 + t1 + 1) >> 1; @@ -1022,10 +1097,11 @@ static void FUNCC(pred8x8l_vertical_left)(uint8_t *p_src, int has_topleft, int h SRC(7,6)= (t10 + t11 + 1) >> 1; SRC(7,7)= (t10 + 2*t11 + t12 + 2) >> 2; } -static void FUNCC(pred8x8l_horizontal_up)(uint8_t *p_src, int has_topleft, int has_topright, int p_stride) +static void FUNCC(pred8x8l_horizontal_up)(uint8_t *_src, int has_topleft, + int has_topright, ptrdiff_t _stride) { - pixel *src = (pixel*)p_src; - int stride = p_stride>>(sizeof(pixel)-1); + pixel *src = (pixel*)_src; + int stride = _stride>>(sizeof(pixel)-1); PREDICT_8x8_LOAD_LEFT; SRC(0,0)= (l0 + l1 + 1) >> 1; SRC(1,0)= (l0 + 2*l1 + l2 + 2) >> 2; @@ -1056,10 +1132,12 @@ static void FUNCC(pred8x8l_horizontal_up)(uint8_t *p_src, int has_topleft, int h #undef PL #undef SRC -static void FUNCC(pred4x4_vertical_add)(uint8_t *p_pix, const DCTELEM *p_block, int stride){ +static void FUNCC(pred4x4_vertical_add)(uint8_t *_pix, const DCTELEM *_block, + ptrdiff_t stride) +{ int i; - pixel *pix = (pixel*)p_pix; - const dctcoef *block = (const dctcoef*)p_block; + pixel *pix = (pixel*)_pix; + const dctcoef *block = (const dctcoef*)_block; stride >>= sizeof(pixel)-1; pix -= stride; for(i=0; i<4; i++){ @@ -1073,10 +1151,12 @@ static void FUNCC(pred4x4_vertical_add)(uint8_t *p_pix, const DCTELEM *p_block, } } -static void FUNCC(pred4x4_horizontal_add)(uint8_t *p_pix, const DCTELEM *p_block, int stride){ +static void FUNCC(pred4x4_horizontal_add)(uint8_t *_pix, const DCTELEM *_block, + ptrdiff_t stride) +{ int i; - pixel *pix = (pixel*)p_pix; - const dctcoef *block = (const dctcoef*)p_block; + pixel *pix = (pixel*)_pix; + const dctcoef *block = (const dctcoef*)_block; stride >>= sizeof(pixel)-1; for(i=0; i<4; i++){ pixel v = pix[-1]; @@ -1089,10 +1169,12 @@ static void FUNCC(pred4x4_horizontal_add)(uint8_t *p_pix, const DCTELEM *p_block } } -static void FUNCC(pred8x8l_vertical_add)(uint8_t *p_pix, const DCTELEM *p_block, int stride){ +static void FUNCC(pred8x8l_vertical_add)(uint8_t *_pix, const DCTELEM *_block, + ptrdiff_t stride) +{ int i; - pixel *pix = (pixel*)p_pix; - const dctcoef *block = (const dctcoef*)p_block; + pixel *pix = (pixel*)_pix; + const dctcoef *block = (const dctcoef*)_block; stride >>= sizeof(pixel)-1; pix -= stride; for(i=0; i<8; i++){ @@ -1110,10 +1192,12 @@ static void FUNCC(pred8x8l_vertical_add)(uint8_t *p_pix, const DCTELEM *p_block, } } -static void FUNCC(pred8x8l_horizontal_add)(uint8_t *p_pix, const DCTELEM *p_block, int stride){ +static void FUNCC(pred8x8l_horizontal_add)(uint8_t *_pix, const DCTELEM *_block, + ptrdiff_t stride) +{ int i; - pixel *pix = (pixel*)p_pix; - const dctcoef *block = (const dctcoef*)p_block; + pixel *pix = (pixel*)_pix; + const dctcoef *block = (const dctcoef*)_block; stride >>= sizeof(pixel)-1; for(i=0; i<8; i++){ pixel v = pix[-1]; @@ -1130,25 +1214,36 @@ static void FUNCC(pred8x8l_horizontal_add)(uint8_t *p_pix, const DCTELEM *p_bloc } } -static void FUNCC(pred16x16_vertical_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred16x16_vertical_add)(uint8_t *pix, const int *block_offset, + const DCTELEM *block, + ptrdiff_t stride) +{ int i; for(i=0; i<16; i++) FUNCC(pred4x4_vertical_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); } -static void FUNCC(pred16x16_horizontal_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred16x16_horizontal_add)(uint8_t *pix, + const int *block_offset, + const DCTELEM *block, + ptrdiff_t stride) +{ int i; for(i=0; i<16; i++) FUNCC(pred4x4_horizontal_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); } -static void FUNCC(pred8x8_vertical_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred8x8_vertical_add)(uint8_t *pix, const int *block_offset, + const DCTELEM *block, ptrdiff_t stride) +{ int i; for(i=0; i<4; i++) FUNCC(pred4x4_vertical_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); } -static void FUNCC(pred8x16_vertical_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred8x16_vertical_add)(uint8_t *pix, const int *block_offset, + const DCTELEM *block, ptrdiff_t stride) +{ int i; for(i=0; i<4; i++) FUNCC(pred4x4_vertical_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); @@ -1156,13 +1251,19 @@ static void FUNCC(pred8x16_vertical_add)(uint8_t *pix, const int *block_offset, FUNCC(pred4x4_vertical_add)(pix + block_offset[i+4], block + i*16*sizeof(pixel), stride); } -static void FUNCC(pred8x8_horizontal_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred8x8_horizontal_add)(uint8_t *pix, const int *block_offset, + const DCTELEM *block, + ptrdiff_t stride) +{ int i; for(i=0; i<4; i++) FUNCC(pred4x4_horizontal_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); } -static void FUNCC(pred8x16_horizontal_add)(uint8_t *pix, const int *block_offset, const DCTELEM *block, int stride){ +static void FUNCC(pred8x16_horizontal_add)(uint8_t *pix, + const int *block_offset, + const DCTELEM *block, ptrdiff_t stride) +{ int i; for(i=0; i<4; i++) FUNCC(pred4x4_horizontal_add)(pix + block_offset[i], block + i*16*sizeof(pixel), stride); |