swscale/x86/output: Simplify creating dither register

With 16-byte registers, only the lower quadword needs to be rotated,
because only the low eight bytes of the register are used by the
byte-to-word zero-extension (punpcklbw) performed immediately afterwards.

Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
This commit is contained in:
Andreas Rheinhardt
2026-04-10 02:15:51 +02:00
parent f5c5bca803
commit 0bb161fd09

View File

@@ -253,8 +253,10 @@ cglobal yuv2planeX_%1, %3, 8, %2, filter, fltsize, src, dst, w, dither, offset
jz .no_rot
%if mmsize == 16
punpcklqdq m_dith, m_dith
%endif ; mmsize == 16
psrldq m_dith, 3
%else
PALIGNR m_dith, m_dith, 3, m0
%endif ; mmsize == 16
.no_rot:
%if mmsize == 16
punpcklbw m_dith, m6