This is an automated email from the git hooks/post-receive script.

Git pushed a commit to branch master
in repository ffmpeg.

commit 8901f858eb14f720e316ea5c1f195cf004956f55
Author:     Andreas Rheinhardt <[email protected]>
AuthorDate: Thu Mar 19 14:33:55 2026 +0100
Commit:     Andreas Rheinhardt <[email protected]>
CommitDate: Mon Mar 30 13:51:53 2026 +0200

    avcodec/x86/vvc/alf: Hoist creating shift register out of loop
    
    Possible now that this function no longer uses unnecessarily many
    registers.
    
    Signed-off-by: Andreas Rheinhardt <[email protected]>
---
 libavcodec/x86/vvc/alf.asm | 11 ++++-------
 1 file changed, 4 insertions(+), 7 deletions(-)

diff --git a/libavcodec/x86/vvc/alf.asm b/libavcodec/x86/vvc/alf.asm
index c52660d222..4dc396afce 100644
--- a/libavcodec/x86/vvc/alf.asm
+++ b/libavcodec/x86/vvc/alf.asm
@@ -784,15 +784,10 @@ cglobal vvc_alf_classify_grad_%1bpc, 6, 14, 12, 
gradient_sum, src, src_stride, w
     pblendvb          m2, m5, m8, m1     ; hvd1
     pblendvb          m3, m6, m3, m1     ; hvd0
 
-%if ps != 1  ; high bit depth
-    movd             xm5, bit_depthd
-    vpbroadcastd      m5, xm5
-%endif
-
     ;*class_idx = arg_var[av_clip_uintp2(sum_hv * ac >> (BIT_DEPTH - 1), 4)];
     pmulld            m0, m9             ; sum_hv * ac
 %if ps != 1
-    vpsrlvd           m0, m0, m5
+    vpsrlvd           m0, m0, m11
 %else
     psrld             m0, 7
 %endif
@@ -844,11 +839,13 @@ cglobal vvc_alf_classify_grad_%1bpc, 6, 14, 12, 
gradient_sum, src, src_stride, w
 %macro ALF_CLASSIFY 1
 %define ps (%1 / 8)
 ALF_CLASSIFY_GRAD %1
-cglobal vvc_alf_classify_%1bpc, 7, 14, 11, class_idx, transpose_idx, 
gradient_sum, width, height, vb_pos, bit_depth, \
+cglobal vvc_alf_classify_%1bpc, 7, 14, 11+(ps!=1), class_idx, transpose_idx, 
gradient_sum, width, height, vb_pos, bit_depth, \
     x, y, grad, sum_stride, sum_stride3, temp, w
 
 %if ps != 1
     sub       bit_depthd, 1
+    movd            xm11, bit_depthd
+    vpbroadcastd     m11, xm11
 %endif
 
     ; now we can use gradient to get class idx and transpose idx

_______________________________________________
ffmpeg-cvslog mailing list -- [email protected]
To unsubscribe send an email to [email protected]

Reply via email to