diff --git a/libavcodec/x86/h264_deblock.asm b/libavcodec/x86/h264_deblock.asm index 435c8be56f..509a0dbe0c 100644 --- a/libavcodec/x86/h264_deblock.asm +++ b/libavcodec/x86/h264_deblock.asm @@ -282,18 +282,18 @@ cextern pb_3 ; int8_t *tc0) ;----------------------------------------------------------------------------- %macro DEBLOCK_LUMA 0 -cglobal deblock_v_luma_8, 5,5,10 +cglobal deblock_v_luma_8, 5,5,10, pix_, stride_, alpha_, beta_, base3_ movd m8, [r4] ; tc0 - lea r4, [r1*3] - dec r2d ; alpha-1 + lea r4, [stride_q*3] + dec alpha_d ; alpha-1 neg r4 - dec r3d ; beta-1 - add r4, r0 ; pix-3*stride + dec beta_d ; beta-1 + add base3_q, pix_q ; pix-3*stride - mova m0, [r4+r1] ; p1 - mova m1, [r4+2*r1] ; p0 - mova m2, [r0] ; q0 - mova m3, [r0+r1] ; q1 + mova m0, [base3_q + stride_q] ; p1 + mova m1, [base3_q + 2*stride_q] ; p0 + mova m2, [pix_q] ; q0 + mova m3, [pix_q + stride_q] ; q1 LOAD_MASK r2d, r3d punpcklbw m8, m8 @@ -303,24 +303,24 @@ cglobal deblock_v_luma_8, 5,5,10 pandn m9, m7 pand m8, m9 - movdqa m3, [r4] ; p2 + movdqa m3, [base3_q] ; p2 DIFF_GT2 m1, m3, m5, m6, m7 ; |p2-p0| > beta-1 pand m6, m9 psubb m7, m8, m6 pand m6, m8 - LUMA_Q1 m0, m3, [r4], [r4+r1], m6, m4 + LUMA_Q1 m0, m3, [base3_q], [base3_q + stride_q], m6, m4 - movdqa m4, [r0+2*r1] ; q2 + movdqa m4, [pix_q + 2*stride_q] ; q2 DIFF_GT2 m2, m4, m5, m6, m3 ; |q2-q0| > beta-1 pand m6, m9 pand m8, m6 psubb m7, m6 - mova m3, [r0+r1] - LUMA_Q1 m3, m4, [r0+2*r1], [r0+r1], m8, m6 + mova m3, [pix_q + stride_q] + LUMA_Q1 m3, m4, [pix_q + 2*stride_q], [pix_q + stride_q], m8, m6 DEBLOCK_P0_Q0 - mova [r4+2*r1], m1 - mova [r0], m2 + mova [base3_q + 2*stride_q], m1 + mova [pix_q], m2 RET ;-----------------------------------------------------------------------------