; 1
; 0
; mirror of https://github.com/bitdefender/bddisasm.git synced 2024-12-23 06:28:13 +00:00
; bddisasm/bddisasm_test/x86/avx512/avx512bw_64.asm
; BITDEFENDER\vlutas 9ba1e6a2f9 Added support for new Intel instructions, per Intel ISA extensions document #319433-046 (September 2022): PREFETCHITI, RAO-INT, CMPCCXADD, WRMSRNS, MSRLIST, AMX-FP16, AVX-IFMA, AVX-NE-CONVERT, AVX-VNNI-INT8.
; Multiple minor fixes to existing instructions.
; Moved x86 decoding tests in a separate directory & improved the test script.
; 2022-10-04 12:22:59 +03:00
;
; 2746 lines
; 104 KiB
; NASM

; Assemble everything that follows in 64-bit mode.
bits 64
; Opmask-register instructions in their doubleword (d) and quadword (q) forms.
; NOTE(review): this file looks like a list of decoder test vectors, so line
; order and content presumably must match a reference output - confirm before
; reordering or removing anything.

; Three-operand mask arithmetic/logic: destination k3, sources k7 and k1.
kaddd k3, k7, k1
kaddq k3, k7, k1
kandd k3, k7, k1
kandnd k3, k7, k1
kandnq k3, k7, k1
kandq k3, k7, k1
; kmovd: memory source ([rbx], [rbx+rsi*8+256], [rbx+rsi*8-256]), mask source,
; memory destination, and moves between a mask register and a 32-bit GPR.
; NOTE(review): "kmovd k3, [rbx]" appears twice; left untouched on purpose.
kmovd k3, [rbx]
kmovd k3, [rbx+rsi*8+256]
kmovd k3, [rbx+rsi*8-256]
kmovd k3, k1
kmovd k3, [rbx]
kmovd [rbx], k3
kmovd [rbx+rsi*8+256], k3
kmovd [rbx+rsi*8-256], k3
kmovd k3, ecx
kmovd ecx, k1
; kmovq: same operand shapes as kmovd above, with a 64-bit GPR (rcx).
; NOTE(review): "kmovq k3, [rbx]" appears twice; left untouched on purpose.
kmovq k3, [rbx]
kmovq k3, [rbx+rsi*8+256]
kmovq k3, [rbx+rsi*8-256]
kmovq k3, k1
kmovq k3, [rbx]
kmovq [rbx], k3
kmovq [rbx+rsi*8+256], k3
kmovq [rbx+rsi*8-256], k3
kmovq k3, rcx
kmovq rcx, k1
; Two-operand and three-operand mask logic / test forms.
knotd k3, k1
knotq k3, k1
kord k3, k7, k1
korq k3, k7, k1
kortestd k3, k1
kortestq k3, k1
; Mask shifts with an immediate count of 10.
kshiftld k3, k1, 10
kshiftlq k3, k1, 10
kshiftrd k3, k1, 10
kshiftrq k3, k1, 10
ktestd k3, k1
ktestq k3, k1
; Mask unpack and xnor/xor, three-operand forms.
kunpckdq k3, k7, k1
kunpckwd k3, k7, k1
kxnord k3, k7, k1
kxnorq k3, k7, k1
kxord k3, k7, k1
kxorq k3, k7, k1
; vdbpsadbw, immediate operand fixed at 10.
; For each vector width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set of four is repeated with no
; opmask, with {k5}, and with {k5}{z}.
vdbpsadbw xmm2, xmm7, xmm0, 10
vdbpsadbw xmm2, xmm7, [rbx], 10
vdbpsadbw xmm2, xmm7, [rbx+r11*8+256], 10
vdbpsadbw xmm2, xmm7, [rbx+r11*8-256], 10
vdbpsadbw xmm2{k5}, xmm7, xmm0, 10
vdbpsadbw xmm2{k5}, xmm7, [rbx], 10
vdbpsadbw xmm2{k5}, xmm7, [rbx+r11*8+256], 10
vdbpsadbw xmm2{k5}, xmm7, [rbx+r11*8-256], 10
vdbpsadbw xmm2{k5}{z}, xmm7, xmm0, 10
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx], 10
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10
; 256-bit forms (ymm16 destination, ymm13/ymm15 sources).
vdbpsadbw ymm16, ymm13, ymm15, 10
vdbpsadbw ymm16, ymm13, [rbx], 10
vdbpsadbw ymm16, ymm13, [rbx+r11*8+256], 10
vdbpsadbw ymm16, ymm13, [rbx+r11*8-256], 10
vdbpsadbw ymm16{k5}, ymm13, ymm15, 10
vdbpsadbw ymm16{k5}, ymm13, [rbx], 10
vdbpsadbw ymm16{k5}, ymm13, [rbx+r11*8+256], 10
vdbpsadbw ymm16{k5}, ymm13, [rbx+r11*8-256], 10
vdbpsadbw ymm16{k5}{z}, ymm13, ymm15, 10
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx], 10
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10
; 512-bit forms (zmm24 is both destination and first source).
vdbpsadbw zmm24, zmm24, zmm31, 10
vdbpsadbw zmm24, zmm24, [rbx], 10
vdbpsadbw zmm24, zmm24, [rbx+r11*8+256], 10
vdbpsadbw zmm24, zmm24, [rbx+r11*8-256], 10
vdbpsadbw zmm24{k5}, zmm24, zmm31, 10
vdbpsadbw zmm24{k5}, zmm24, [rbx], 10
vdbpsadbw zmm24{k5}, zmm24, [rbx+r11*8+256], 10
vdbpsadbw zmm24{k5}, zmm24, [rbx+r11*8-256], 10
vdbpsadbw zmm24{k5}{z}, zmm24, zmm31, 10
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx], 10
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10
; vmovdqu16 with a vector-register destination.
; For each width (xmm, ymm, zmm) the source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vmovdqu16 xmm2, xmm0
vmovdqu16 xmm2, [rbx]
vmovdqu16 xmm2, [rbx+r11*8+256]
vmovdqu16 xmm2, [rbx+r11*8-256]
vmovdqu16 xmm2{k5}, xmm0
vmovdqu16 xmm2{k5}, [rbx]
vmovdqu16 xmm2{k5}, [rbx+r11*8+256]
vmovdqu16 xmm2{k5}, [rbx+r11*8-256]
vmovdqu16 xmm2{k5}{z}, xmm0
vmovdqu16 xmm2{k5}{z}, [rbx]
vmovdqu16 xmm2{k5}{z}, [rbx+r11*8+256]
vmovdqu16 xmm2{k5}{z}, [rbx+r11*8-256]
vmovdqu16 ymm16, ymm15
vmovdqu16 ymm16, [rbx]
vmovdqu16 ymm16, [rbx+r11*8+256]
vmovdqu16 ymm16, [rbx+r11*8-256]
vmovdqu16 ymm16{k5}, ymm15
vmovdqu16 ymm16{k5}, [rbx]
vmovdqu16 ymm16{k5}, [rbx+r11*8+256]
vmovdqu16 ymm16{k5}, [rbx+r11*8-256]
vmovdqu16 ymm16{k5}{z}, ymm15
vmovdqu16 ymm16{k5}{z}, [rbx]
vmovdqu16 ymm16{k5}{z}, [rbx+r11*8+256]
vmovdqu16 ymm16{k5}{z}, [rbx+r11*8-256]
vmovdqu16 zmm24, zmm31
vmovdqu16 zmm24, [rbx]
vmovdqu16 zmm24, [rbx+r11*8+256]
vmovdqu16 zmm24, [rbx+r11*8-256]
vmovdqu16 zmm24{k5}, zmm31
vmovdqu16 zmm24{k5}, [rbx]
vmovdqu16 zmm24{k5}, [rbx+r11*8+256]
vmovdqu16 zmm24{k5}, [rbx+r11*8-256]
vmovdqu16 zmm24{k5}{z}, zmm31
vmovdqu16 zmm24{k5}{z}, [rbx]
vmovdqu16 zmm24{k5}{z}, [rbx+r11*8+256]
vmovdqu16 zmm24{k5}{z}, [rbx+r11*8-256]
; Reversed operand order: register pairs swapped relative to the lines above,
; then memory destinations for each width. No opmask variants in this part.
vmovdqu16 xmm0, xmm2
vmovdqu16 ymm15, ymm16
vmovdqu16 zmm31, zmm24
vmovdqu16 [rbx], xmm2
vmovdqu16 [rbx], ymm16
vmovdqu16 [rbx], zmm24
vmovdqu16 [rbx+r11*8+256], xmm2
vmovdqu16 [rbx+r11*8+256], ymm16
vmovdqu16 [rbx+r11*8+256], zmm24
vmovdqu16 [rbx+r11*8-256], xmm2
vmovdqu16 [rbx+r11*8-256], ymm16
vmovdqu16 [rbx+r11*8-256], zmm24
; vmovdqu8 with a vector-register destination.
; For each width (xmm, ymm, zmm) the source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vmovdqu8 xmm2, xmm0
vmovdqu8 xmm2, [rbx]
vmovdqu8 xmm2, [rbx+r11*8+256]
vmovdqu8 xmm2, [rbx+r11*8-256]
vmovdqu8 xmm2{k5}, xmm0
vmovdqu8 xmm2{k5}, [rbx]
vmovdqu8 xmm2{k5}, [rbx+r11*8+256]
vmovdqu8 xmm2{k5}, [rbx+r11*8-256]
vmovdqu8 xmm2{k5}{z}, xmm0
vmovdqu8 xmm2{k5}{z}, [rbx]
vmovdqu8 xmm2{k5}{z}, [rbx+r11*8+256]
vmovdqu8 xmm2{k5}{z}, [rbx+r11*8-256]
vmovdqu8 ymm16, ymm15
vmovdqu8 ymm16, [rbx]
vmovdqu8 ymm16, [rbx+r11*8+256]
vmovdqu8 ymm16, [rbx+r11*8-256]
vmovdqu8 ymm16{k5}, ymm15
vmovdqu8 ymm16{k5}, [rbx]
vmovdqu8 ymm16{k5}, [rbx+r11*8+256]
vmovdqu8 ymm16{k5}, [rbx+r11*8-256]
vmovdqu8 ymm16{k5}{z}, ymm15
vmovdqu8 ymm16{k5}{z}, [rbx]
vmovdqu8 ymm16{k5}{z}, [rbx+r11*8+256]
vmovdqu8 ymm16{k5}{z}, [rbx+r11*8-256]
vmovdqu8 zmm24, zmm31
vmovdqu8 zmm24, [rbx]
vmovdqu8 zmm24, [rbx+r11*8+256]
vmovdqu8 zmm24, [rbx+r11*8-256]
vmovdqu8 zmm24{k5}, zmm31
vmovdqu8 zmm24{k5}, [rbx]
vmovdqu8 zmm24{k5}, [rbx+r11*8+256]
vmovdqu8 zmm24{k5}, [rbx+r11*8-256]
vmovdqu8 zmm24{k5}{z}, zmm31
vmovdqu8 zmm24{k5}{z}, [rbx]
vmovdqu8 zmm24{k5}{z}, [rbx+r11*8+256]
vmovdqu8 zmm24{k5}{z}, [rbx+r11*8-256]
; Reversed operand order: register pairs swapped relative to the lines above,
; then memory destinations for each width. No opmask variants in this part.
vmovdqu8 xmm0, xmm2
vmovdqu8 ymm15, ymm16
vmovdqu8 zmm31, zmm24
vmovdqu8 [rbx], xmm2
vmovdqu8 [rbx], ymm16
vmovdqu8 [rbx], zmm24
vmovdqu8 [rbx+r11*8+256], xmm2
vmovdqu8 [rbx+r11*8+256], ymm16
vmovdqu8 [rbx+r11*8+256], zmm24
vmovdqu8 [rbx+r11*8-256], xmm2
vmovdqu8 [rbx+r11*8-256], ymm16
vmovdqu8 [rbx+r11*8-256], zmm24
; vpabsb, two-operand form.
; For each width (xmm, ymm, zmm) the source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpabsb xmm2, xmm0
vpabsb xmm2, [rbx]
vpabsb xmm2, [rbx+r11*8+256]
vpabsb xmm2, [rbx+r11*8-256]
vpabsb xmm2{k5}, xmm0
vpabsb xmm2{k5}, [rbx]
vpabsb xmm2{k5}, [rbx+r11*8+256]
vpabsb xmm2{k5}, [rbx+r11*8-256]
vpabsb xmm2{k5}{z}, xmm0
vpabsb xmm2{k5}{z}, [rbx]
vpabsb xmm2{k5}{z}, [rbx+r11*8+256]
vpabsb xmm2{k5}{z}, [rbx+r11*8-256]
vpabsb ymm16, ymm15
vpabsb ymm16, [rbx]
vpabsb ymm16, [rbx+r11*8+256]
vpabsb ymm16, [rbx+r11*8-256]
vpabsb ymm16{k5}, ymm15
vpabsb ymm16{k5}, [rbx]
vpabsb ymm16{k5}, [rbx+r11*8+256]
vpabsb ymm16{k5}, [rbx+r11*8-256]
vpabsb ymm16{k5}{z}, ymm15
vpabsb ymm16{k5}{z}, [rbx]
vpabsb ymm16{k5}{z}, [rbx+r11*8+256]
vpabsb ymm16{k5}{z}, [rbx+r11*8-256]
vpabsb zmm24, zmm31
vpabsb zmm24, [rbx]
vpabsb zmm24, [rbx+r11*8+256]
vpabsb zmm24, [rbx+r11*8-256]
vpabsb zmm24{k5}, zmm31
vpabsb zmm24{k5}, [rbx]
vpabsb zmm24{k5}, [rbx+r11*8+256]
vpabsb zmm24{k5}, [rbx+r11*8-256]
vpabsb zmm24{k5}{z}, zmm31
vpabsb zmm24{k5}{z}, [rbx]
vpabsb zmm24{k5}{z}, [rbx+r11*8+256]
vpabsb zmm24{k5}{z}, [rbx+r11*8-256]
; vpabsw, two-operand form.
; For each width (xmm, ymm, zmm) the source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpabsw xmm2, xmm0
vpabsw xmm2, [rbx]
vpabsw xmm2, [rbx+r11*8+256]
vpabsw xmm2, [rbx+r11*8-256]
vpabsw xmm2{k5}, xmm0
vpabsw xmm2{k5}, [rbx]
vpabsw xmm2{k5}, [rbx+r11*8+256]
vpabsw xmm2{k5}, [rbx+r11*8-256]
vpabsw xmm2{k5}{z}, xmm0
vpabsw xmm2{k5}{z}, [rbx]
vpabsw xmm2{k5}{z}, [rbx+r11*8+256]
vpabsw xmm2{k5}{z}, [rbx+r11*8-256]
vpabsw ymm16, ymm15
vpabsw ymm16, [rbx]
vpabsw ymm16, [rbx+r11*8+256]
vpabsw ymm16, [rbx+r11*8-256]
vpabsw ymm16{k5}, ymm15
vpabsw ymm16{k5}, [rbx]
vpabsw ymm16{k5}, [rbx+r11*8+256]
vpabsw ymm16{k5}, [rbx+r11*8-256]
vpabsw ymm16{k5}{z}, ymm15
vpabsw ymm16{k5}{z}, [rbx]
vpabsw ymm16{k5}{z}, [rbx+r11*8+256]
vpabsw ymm16{k5}{z}, [rbx+r11*8-256]
vpabsw zmm24, zmm31
vpabsw zmm24, [rbx]
vpabsw zmm24, [rbx+r11*8+256]
vpabsw zmm24, [rbx+r11*8-256]
vpabsw zmm24{k5}, zmm31
vpabsw zmm24{k5}, [rbx]
vpabsw zmm24{k5}, [rbx+r11*8+256]
vpabsw zmm24{k5}, [rbx+r11*8-256]
vpabsw zmm24{k5}{z}, zmm31
vpabsw zmm24{k5}{z}, [rbx]
vpabsw zmm24{k5}{z}, [rbx+r11*8+256]
vpabsw zmm24{k5}{z}, [rbx+r11*8-256]
; vpackssdw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx]{1toN} (N = 4, 8, 16 for xmm, ymm, zmm), [rbx+r11*8+256] and
; [rbx+r11*8-256]; each set of five is repeated with no opmask, with {k5},
; and with {k5}{z}.
vpackssdw xmm2, xmm7, xmm0
vpackssdw xmm2, xmm7, [rbx]
vpackssdw xmm2, xmm7, [rbx]{1to4}
vpackssdw xmm2, xmm7, [rbx+r11*8+256]
vpackssdw xmm2, xmm7, [rbx+r11*8-256]
vpackssdw xmm2{k5}, xmm7, xmm0
vpackssdw xmm2{k5}, xmm7, [rbx]
vpackssdw xmm2{k5}, xmm7, [rbx]{1to4}
vpackssdw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpackssdw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpackssdw xmm2{k5}{z}, xmm7, xmm0
vpackssdw xmm2{k5}{z}, xmm7, [rbx]
vpackssdw xmm2{k5}{z}, xmm7, [rbx]{1to4}
vpackssdw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpackssdw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpackssdw ymm16, ymm13, ymm15
vpackssdw ymm16, ymm13, [rbx]
vpackssdw ymm16, ymm13, [rbx]{1to8}
vpackssdw ymm16, ymm13, [rbx+r11*8+256]
vpackssdw ymm16, ymm13, [rbx+r11*8-256]
vpackssdw ymm16{k5}, ymm13, ymm15
vpackssdw ymm16{k5}, ymm13, [rbx]
vpackssdw ymm16{k5}, ymm13, [rbx]{1to8}
vpackssdw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpackssdw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpackssdw ymm16{k5}{z}, ymm13, ymm15
vpackssdw ymm16{k5}{z}, ymm13, [rbx]
vpackssdw ymm16{k5}{z}, ymm13, [rbx]{1to8}
vpackssdw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpackssdw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpackssdw zmm24, zmm24, zmm31
vpackssdw zmm24, zmm24, [rbx]
vpackssdw zmm24, zmm24, [rbx]{1to16}
vpackssdw zmm24, zmm24, [rbx+r11*8+256]
vpackssdw zmm24, zmm24, [rbx+r11*8-256]
vpackssdw zmm24{k5}, zmm24, zmm31
vpackssdw zmm24{k5}, zmm24, [rbx]
vpackssdw zmm24{k5}, zmm24, [rbx]{1to16}
vpackssdw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpackssdw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpackssdw zmm24{k5}{z}, zmm24, zmm31
vpackssdw zmm24{k5}{z}, zmm24, [rbx]
vpackssdw zmm24{k5}{z}, zmm24, [rbx]{1to16}
vpackssdw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpackssdw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpacksswb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpacksswb xmm2, xmm7, xmm0
vpacksswb xmm2, xmm7, [rbx]
vpacksswb xmm2, xmm7, [rbx+r11*8+256]
vpacksswb xmm2, xmm7, [rbx+r11*8-256]
vpacksswb xmm2{k5}, xmm7, xmm0
vpacksswb xmm2{k5}, xmm7, [rbx]
vpacksswb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpacksswb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpacksswb xmm2{k5}{z}, xmm7, xmm0
vpacksswb xmm2{k5}{z}, xmm7, [rbx]
vpacksswb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpacksswb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpacksswb ymm16, ymm13, ymm15
vpacksswb ymm16, ymm13, [rbx]
vpacksswb ymm16, ymm13, [rbx+r11*8+256]
vpacksswb ymm16, ymm13, [rbx+r11*8-256]
vpacksswb ymm16{k5}, ymm13, ymm15
vpacksswb ymm16{k5}, ymm13, [rbx]
vpacksswb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpacksswb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpacksswb ymm16{k5}{z}, ymm13, ymm15
vpacksswb ymm16{k5}{z}, ymm13, [rbx]
vpacksswb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpacksswb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpacksswb zmm24, zmm24, zmm31
vpacksswb zmm24, zmm24, [rbx]
vpacksswb zmm24, zmm24, [rbx+r11*8+256]
vpacksswb zmm24, zmm24, [rbx+r11*8-256]
vpacksswb zmm24{k5}, zmm24, zmm31
vpacksswb zmm24{k5}, zmm24, [rbx]
vpacksswb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpacksswb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpacksswb zmm24{k5}{z}, zmm24, zmm31
vpacksswb zmm24{k5}{z}, zmm24, [rbx]
vpacksswb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpacksswb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpackusdw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx]{1toN} (N = 4, 8, 16 for xmm, ymm, zmm), [rbx+r11*8+256] and
; [rbx+r11*8-256]; each set of five is repeated with no opmask, with {k5},
; and with {k5}{z}.
vpackusdw xmm2, xmm7, xmm0
vpackusdw xmm2, xmm7, [rbx]
vpackusdw xmm2, xmm7, [rbx]{1to4}
vpackusdw xmm2, xmm7, [rbx+r11*8+256]
vpackusdw xmm2, xmm7, [rbx+r11*8-256]
vpackusdw xmm2{k5}, xmm7, xmm0
vpackusdw xmm2{k5}, xmm7, [rbx]
vpackusdw xmm2{k5}, xmm7, [rbx]{1to4}
vpackusdw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpackusdw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpackusdw xmm2{k5}{z}, xmm7, xmm0
vpackusdw xmm2{k5}{z}, xmm7, [rbx]
vpackusdw xmm2{k5}{z}, xmm7, [rbx]{1to4}
vpackusdw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpackusdw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpackusdw ymm16, ymm13, ymm15
vpackusdw ymm16, ymm13, [rbx]
vpackusdw ymm16, ymm13, [rbx]{1to8}
vpackusdw ymm16, ymm13, [rbx+r11*8+256]
vpackusdw ymm16, ymm13, [rbx+r11*8-256]
vpackusdw ymm16{k5}, ymm13, ymm15
vpackusdw ymm16{k5}, ymm13, [rbx]
vpackusdw ymm16{k5}, ymm13, [rbx]{1to8}
vpackusdw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpackusdw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpackusdw ymm16{k5}{z}, ymm13, ymm15
vpackusdw ymm16{k5}{z}, ymm13, [rbx]
vpackusdw ymm16{k5}{z}, ymm13, [rbx]{1to8}
vpackusdw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpackusdw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpackusdw zmm24, zmm24, zmm31
vpackusdw zmm24, zmm24, [rbx]
vpackusdw zmm24, zmm24, [rbx]{1to16}
vpackusdw zmm24, zmm24, [rbx+r11*8+256]
vpackusdw zmm24, zmm24, [rbx+r11*8-256]
vpackusdw zmm24{k5}, zmm24, zmm31
vpackusdw zmm24{k5}, zmm24, [rbx]
vpackusdw zmm24{k5}, zmm24, [rbx]{1to16}
vpackusdw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpackusdw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpackusdw zmm24{k5}{z}, zmm24, zmm31
vpackusdw zmm24{k5}{z}, zmm24, [rbx]
vpackusdw zmm24{k5}{z}, zmm24, [rbx]{1to16}
vpackusdw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpackusdw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpackuswb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpackuswb xmm2, xmm7, xmm0
vpackuswb xmm2, xmm7, [rbx]
vpackuswb xmm2, xmm7, [rbx+r11*8+256]
vpackuswb xmm2, xmm7, [rbx+r11*8-256]
vpackuswb xmm2{k5}, xmm7, xmm0
vpackuswb xmm2{k5}, xmm7, [rbx]
vpackuswb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpackuswb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpackuswb xmm2{k5}{z}, xmm7, xmm0
vpackuswb xmm2{k5}{z}, xmm7, [rbx]
vpackuswb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpackuswb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpackuswb ymm16, ymm13, ymm15
vpackuswb ymm16, ymm13, [rbx]
vpackuswb ymm16, ymm13, [rbx+r11*8+256]
vpackuswb ymm16, ymm13, [rbx+r11*8-256]
vpackuswb ymm16{k5}, ymm13, ymm15
vpackuswb ymm16{k5}, ymm13, [rbx]
vpackuswb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpackuswb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpackuswb ymm16{k5}{z}, ymm13, ymm15
vpackuswb ymm16{k5}{z}, ymm13, [rbx]
vpackuswb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpackuswb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpackuswb zmm24, zmm24, zmm31
vpackuswb zmm24, zmm24, [rbx]
vpackuswb zmm24, zmm24, [rbx+r11*8+256]
vpackuswb zmm24, zmm24, [rbx+r11*8-256]
vpackuswb zmm24{k5}, zmm24, zmm31
vpackuswb zmm24{k5}, zmm24, [rbx]
vpackuswb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpackuswb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpackuswb zmm24{k5}{z}, zmm24, zmm31
vpackuswb zmm24{k5}{z}, zmm24, [rbx]
vpackuswb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpackuswb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddb xmm2, xmm7, xmm0
vpaddb xmm2, xmm7, [rbx]
vpaddb xmm2, xmm7, [rbx+r11*8+256]
vpaddb xmm2, xmm7, [rbx+r11*8-256]
vpaddb xmm2{k5}, xmm7, xmm0
vpaddb xmm2{k5}, xmm7, [rbx]
vpaddb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddb xmm2{k5}{z}, xmm7, xmm0
vpaddb xmm2{k5}{z}, xmm7, [rbx]
vpaddb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddb ymm16, ymm13, ymm15
vpaddb ymm16, ymm13, [rbx]
vpaddb ymm16, ymm13, [rbx+r11*8+256]
vpaddb ymm16, ymm13, [rbx+r11*8-256]
vpaddb ymm16{k5}, ymm13, ymm15
vpaddb ymm16{k5}, ymm13, [rbx]
vpaddb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddb ymm16{k5}{z}, ymm13, ymm15
vpaddb ymm16{k5}{z}, ymm13, [rbx]
vpaddb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddb zmm24, zmm24, zmm31
vpaddb zmm24, zmm24, [rbx]
vpaddb zmm24, zmm24, [rbx+r11*8+256]
vpaddb zmm24, zmm24, [rbx+r11*8-256]
vpaddb zmm24{k5}, zmm24, zmm31
vpaddb zmm24{k5}, zmm24, [rbx]
vpaddb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddb zmm24{k5}{z}, zmm24, zmm31
vpaddb zmm24{k5}{z}, zmm24, [rbx]
vpaddb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddsb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddsb xmm2, xmm7, xmm0
vpaddsb xmm2, xmm7, [rbx]
vpaddsb xmm2, xmm7, [rbx+r11*8+256]
vpaddsb xmm2, xmm7, [rbx+r11*8-256]
vpaddsb xmm2{k5}, xmm7, xmm0
vpaddsb xmm2{k5}, xmm7, [rbx]
vpaddsb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddsb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddsb xmm2{k5}{z}, xmm7, xmm0
vpaddsb xmm2{k5}{z}, xmm7, [rbx]
vpaddsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddsb ymm16, ymm13, ymm15
vpaddsb ymm16, ymm13, [rbx]
vpaddsb ymm16, ymm13, [rbx+r11*8+256]
vpaddsb ymm16, ymm13, [rbx+r11*8-256]
vpaddsb ymm16{k5}, ymm13, ymm15
vpaddsb ymm16{k5}, ymm13, [rbx]
vpaddsb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddsb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddsb ymm16{k5}{z}, ymm13, ymm15
vpaddsb ymm16{k5}{z}, ymm13, [rbx]
vpaddsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddsb zmm24, zmm24, zmm31
vpaddsb zmm24, zmm24, [rbx]
vpaddsb zmm24, zmm24, [rbx+r11*8+256]
vpaddsb zmm24, zmm24, [rbx+r11*8-256]
vpaddsb zmm24{k5}, zmm24, zmm31
vpaddsb zmm24{k5}, zmm24, [rbx]
vpaddsb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddsb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddsb zmm24{k5}{z}, zmm24, zmm31
vpaddsb zmm24{k5}{z}, zmm24, [rbx]
vpaddsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddsw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddsw xmm2, xmm7, xmm0
vpaddsw xmm2, xmm7, [rbx]
vpaddsw xmm2, xmm7, [rbx+r11*8+256]
vpaddsw xmm2, xmm7, [rbx+r11*8-256]
vpaddsw xmm2{k5}, xmm7, xmm0
vpaddsw xmm2{k5}, xmm7, [rbx]
vpaddsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddsw xmm2{k5}{z}, xmm7, xmm0
vpaddsw xmm2{k5}{z}, xmm7, [rbx]
vpaddsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddsw ymm16, ymm13, ymm15
vpaddsw ymm16, ymm13, [rbx]
vpaddsw ymm16, ymm13, [rbx+r11*8+256]
vpaddsw ymm16, ymm13, [rbx+r11*8-256]
vpaddsw ymm16{k5}, ymm13, ymm15
vpaddsw ymm16{k5}, ymm13, [rbx]
vpaddsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddsw ymm16{k5}{z}, ymm13, ymm15
vpaddsw ymm16{k5}{z}, ymm13, [rbx]
vpaddsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddsw zmm24, zmm24, zmm31
vpaddsw zmm24, zmm24, [rbx]
vpaddsw zmm24, zmm24, [rbx+r11*8+256]
vpaddsw zmm24, zmm24, [rbx+r11*8-256]
vpaddsw zmm24{k5}, zmm24, zmm31
vpaddsw zmm24{k5}, zmm24, [rbx]
vpaddsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddsw zmm24{k5}{z}, zmm24, zmm31
vpaddsw zmm24{k5}{z}, zmm24, [rbx]
vpaddsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddusb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddusb xmm2, xmm7, xmm0
vpaddusb xmm2, xmm7, [rbx]
vpaddusb xmm2, xmm7, [rbx+r11*8+256]
vpaddusb xmm2, xmm7, [rbx+r11*8-256]
vpaddusb xmm2{k5}, xmm7, xmm0
vpaddusb xmm2{k5}, xmm7, [rbx]
vpaddusb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddusb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddusb xmm2{k5}{z}, xmm7, xmm0
vpaddusb xmm2{k5}{z}, xmm7, [rbx]
vpaddusb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddusb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddusb ymm16, ymm13, ymm15
vpaddusb ymm16, ymm13, [rbx]
vpaddusb ymm16, ymm13, [rbx+r11*8+256]
vpaddusb ymm16, ymm13, [rbx+r11*8-256]
vpaddusb ymm16{k5}, ymm13, ymm15
vpaddusb ymm16{k5}, ymm13, [rbx]
vpaddusb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddusb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddusb ymm16{k5}{z}, ymm13, ymm15
vpaddusb ymm16{k5}{z}, ymm13, [rbx]
vpaddusb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddusb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddusb zmm24, zmm24, zmm31
vpaddusb zmm24, zmm24, [rbx]
vpaddusb zmm24, zmm24, [rbx+r11*8+256]
vpaddusb zmm24, zmm24, [rbx+r11*8-256]
vpaddusb zmm24{k5}, zmm24, zmm31
vpaddusb zmm24{k5}, zmm24, [rbx]
vpaddusb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddusb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddusb zmm24{k5}{z}, zmm24, zmm31
vpaddusb zmm24{k5}{z}, zmm24, [rbx]
vpaddusb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddusb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddusw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddusw xmm2, xmm7, xmm0
vpaddusw xmm2, xmm7, [rbx]
vpaddusw xmm2, xmm7, [rbx+r11*8+256]
vpaddusw xmm2, xmm7, [rbx+r11*8-256]
vpaddusw xmm2{k5}, xmm7, xmm0
vpaddusw xmm2{k5}, xmm7, [rbx]
vpaddusw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddusw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddusw xmm2{k5}{z}, xmm7, xmm0
vpaddusw xmm2{k5}{z}, xmm7, [rbx]
vpaddusw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddusw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddusw ymm16, ymm13, ymm15
vpaddusw ymm16, ymm13, [rbx]
vpaddusw ymm16, ymm13, [rbx+r11*8+256]
vpaddusw ymm16, ymm13, [rbx+r11*8-256]
vpaddusw ymm16{k5}, ymm13, ymm15
vpaddusw ymm16{k5}, ymm13, [rbx]
vpaddusw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddusw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddusw ymm16{k5}{z}, ymm13, ymm15
vpaddusw ymm16{k5}{z}, ymm13, [rbx]
vpaddusw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddusw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddusw zmm24, zmm24, zmm31
vpaddusw zmm24, zmm24, [rbx]
vpaddusw zmm24, zmm24, [rbx+r11*8+256]
vpaddusw zmm24, zmm24, [rbx+r11*8-256]
vpaddusw zmm24{k5}, zmm24, zmm31
vpaddusw zmm24{k5}, zmm24, [rbx]
vpaddusw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddusw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddusw zmm24{k5}{z}, zmm24, zmm31
vpaddusw zmm24{k5}{z}, zmm24, [rbx]
vpaddusw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddusw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpaddw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpaddw xmm2, xmm7, xmm0
vpaddw xmm2, xmm7, [rbx]
vpaddw xmm2, xmm7, [rbx+r11*8+256]
vpaddw xmm2, xmm7, [rbx+r11*8-256]
vpaddw xmm2{k5}, xmm7, xmm0
vpaddw xmm2{k5}, xmm7, [rbx]
vpaddw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpaddw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpaddw xmm2{k5}{z}, xmm7, xmm0
vpaddw xmm2{k5}{z}, xmm7, [rbx]
vpaddw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpaddw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpaddw ymm16, ymm13, ymm15
vpaddw ymm16, ymm13, [rbx]
vpaddw ymm16, ymm13, [rbx+r11*8+256]
vpaddw ymm16, ymm13, [rbx+r11*8-256]
vpaddw ymm16{k5}, ymm13, ymm15
vpaddw ymm16{k5}, ymm13, [rbx]
vpaddw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpaddw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpaddw ymm16{k5}{z}, ymm13, ymm15
vpaddw ymm16{k5}{z}, ymm13, [rbx]
vpaddw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpaddw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpaddw zmm24, zmm24, zmm31
vpaddw zmm24, zmm24, [rbx]
vpaddw zmm24, zmm24, [rbx+r11*8+256]
vpaddw zmm24, zmm24, [rbx+r11*8-256]
vpaddw zmm24{k5}, zmm24, zmm31
vpaddw zmm24{k5}, zmm24, [rbx]
vpaddw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpaddw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpaddw zmm24{k5}{z}, zmm24, zmm31
vpaddw zmm24{k5}{z}, zmm24, [rbx]
vpaddw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpaddw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpalignr, immediate operand fixed at 10.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpalignr xmm2, xmm7, xmm0, 10
vpalignr xmm2, xmm7, [rbx], 10
vpalignr xmm2, xmm7, [rbx+r11*8+256], 10
vpalignr xmm2, xmm7, [rbx+r11*8-256], 10
vpalignr xmm2{k5}, xmm7, xmm0, 10
vpalignr xmm2{k5}, xmm7, [rbx], 10
vpalignr xmm2{k5}, xmm7, [rbx+r11*8+256], 10
vpalignr xmm2{k5}, xmm7, [rbx+r11*8-256], 10
vpalignr xmm2{k5}{z}, xmm7, xmm0, 10
vpalignr xmm2{k5}{z}, xmm7, [rbx], 10
vpalignr xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10
vpalignr xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10
vpalignr ymm16, ymm13, ymm15, 10
vpalignr ymm16, ymm13, [rbx], 10
vpalignr ymm16, ymm13, [rbx+r11*8+256], 10
vpalignr ymm16, ymm13, [rbx+r11*8-256], 10
vpalignr ymm16{k5}, ymm13, ymm15, 10
vpalignr ymm16{k5}, ymm13, [rbx], 10
vpalignr ymm16{k5}, ymm13, [rbx+r11*8+256], 10
vpalignr ymm16{k5}, ymm13, [rbx+r11*8-256], 10
vpalignr ymm16{k5}{z}, ymm13, ymm15, 10
vpalignr ymm16{k5}{z}, ymm13, [rbx], 10
vpalignr ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10
vpalignr ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10
vpalignr zmm24, zmm24, zmm31, 10
vpalignr zmm24, zmm24, [rbx], 10
vpalignr zmm24, zmm24, [rbx+r11*8+256], 10
vpalignr zmm24, zmm24, [rbx+r11*8-256], 10
vpalignr zmm24{k5}, zmm24, zmm31, 10
vpalignr zmm24{k5}, zmm24, [rbx], 10
vpalignr zmm24{k5}, zmm24, [rbx+r11*8+256], 10
vpalignr zmm24{k5}, zmm24, [rbx+r11*8-256], 10
vpalignr zmm24{k5}{z}, zmm24, zmm31, 10
vpalignr zmm24{k5}{z}, zmm24, [rbx], 10
vpalignr zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10
vpalignr zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10
; vpavgb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpavgb xmm2, xmm7, xmm0
vpavgb xmm2, xmm7, [rbx]
vpavgb xmm2, xmm7, [rbx+r11*8+256]
vpavgb xmm2, xmm7, [rbx+r11*8-256]
vpavgb xmm2{k5}, xmm7, xmm0
vpavgb xmm2{k5}, xmm7, [rbx]
vpavgb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpavgb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpavgb xmm2{k5}{z}, xmm7, xmm0
vpavgb xmm2{k5}{z}, xmm7, [rbx]
vpavgb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpavgb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpavgb ymm16, ymm13, ymm15
vpavgb ymm16, ymm13, [rbx]
vpavgb ymm16, ymm13, [rbx+r11*8+256]
vpavgb ymm16, ymm13, [rbx+r11*8-256]
vpavgb ymm16{k5}, ymm13, ymm15
vpavgb ymm16{k5}, ymm13, [rbx]
vpavgb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpavgb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpavgb ymm16{k5}{z}, ymm13, ymm15
vpavgb ymm16{k5}{z}, ymm13, [rbx]
vpavgb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpavgb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpavgb zmm24, zmm24, zmm31
vpavgb zmm24, zmm24, [rbx]
vpavgb zmm24, zmm24, [rbx+r11*8+256]
vpavgb zmm24, zmm24, [rbx+r11*8-256]
vpavgb zmm24{k5}, zmm24, zmm31
vpavgb zmm24{k5}, zmm24, [rbx]
vpavgb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpavgb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpavgb zmm24{k5}{z}, zmm24, zmm31
vpavgb zmm24{k5}{z}, zmm24, [rbx]
vpavgb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpavgb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpavgw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpavgw xmm2, xmm7, xmm0
vpavgw xmm2, xmm7, [rbx]
vpavgw xmm2, xmm7, [rbx+r11*8+256]
vpavgw xmm2, xmm7, [rbx+r11*8-256]
vpavgw xmm2{k5}, xmm7, xmm0
vpavgw xmm2{k5}, xmm7, [rbx]
vpavgw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpavgw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpavgw xmm2{k5}{z}, xmm7, xmm0
vpavgw xmm2{k5}{z}, xmm7, [rbx]
vpavgw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpavgw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpavgw ymm16, ymm13, ymm15
vpavgw ymm16, ymm13, [rbx]
vpavgw ymm16, ymm13, [rbx+r11*8+256]
vpavgw ymm16, ymm13, [rbx+r11*8-256]
vpavgw ymm16{k5}, ymm13, ymm15
vpavgw ymm16{k5}, ymm13, [rbx]
vpavgw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpavgw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpavgw ymm16{k5}{z}, ymm13, ymm15
vpavgw ymm16{k5}{z}, ymm13, [rbx]
vpavgw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpavgw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpavgw zmm24, zmm24, zmm31
vpavgw zmm24, zmm24, [rbx]
vpavgw zmm24, zmm24, [rbx+r11*8+256]
vpavgw zmm24, zmm24, [rbx+r11*8-256]
vpavgw zmm24{k5}, zmm24, zmm31
vpavgw zmm24{k5}, zmm24, [rbx]
vpavgw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpavgw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpavgw zmm24{k5}{z}, zmm24, zmm31
vpavgw zmm24{k5}{z}, zmm24, [rbx]
vpavgw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpavgw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpblendmb, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpblendmb xmm2, xmm7, xmm0
vpblendmb xmm2, xmm7, [rbx]
vpblendmb xmm2, xmm7, [rbx+r11*8+256]
vpblendmb xmm2, xmm7, [rbx+r11*8-256]
vpblendmb xmm2{k5}, xmm7, xmm0
vpblendmb xmm2{k5}, xmm7, [rbx]
vpblendmb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpblendmb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpblendmb xmm2{k5}{z}, xmm7, xmm0
vpblendmb xmm2{k5}{z}, xmm7, [rbx]
vpblendmb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpblendmb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpblendmb ymm16, ymm13, ymm15
vpblendmb ymm16, ymm13, [rbx]
vpblendmb ymm16, ymm13, [rbx+r11*8+256]
vpblendmb ymm16, ymm13, [rbx+r11*8-256]
vpblendmb ymm16{k5}, ymm13, ymm15
vpblendmb ymm16{k5}, ymm13, [rbx]
vpblendmb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpblendmb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpblendmb ymm16{k5}{z}, ymm13, ymm15
vpblendmb ymm16{k5}{z}, ymm13, [rbx]
vpblendmb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpblendmb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpblendmb zmm24, zmm24, zmm31
vpblendmb zmm24, zmm24, [rbx]
vpblendmb zmm24, zmm24, [rbx+r11*8+256]
vpblendmb zmm24, zmm24, [rbx+r11*8-256]
vpblendmb zmm24{k5}, zmm24, zmm31
vpblendmb zmm24{k5}, zmm24, [rbx]
vpblendmb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpblendmb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpblendmb zmm24{k5}{z}, zmm24, zmm31
vpblendmb zmm24{k5}{z}, zmm24, [rbx]
vpblendmb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpblendmb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpblendmw, three-operand form.
; For each width (xmm, ymm, zmm) the last source is a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpblendmw xmm2, xmm7, xmm0
vpblendmw xmm2, xmm7, [rbx]
vpblendmw xmm2, xmm7, [rbx+r11*8+256]
vpblendmw xmm2, xmm7, [rbx+r11*8-256]
vpblendmw xmm2{k5}, xmm7, xmm0
vpblendmw xmm2{k5}, xmm7, [rbx]
vpblendmw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpblendmw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpblendmw xmm2{k5}{z}, xmm7, xmm0
vpblendmw xmm2{k5}{z}, xmm7, [rbx]
vpblendmw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpblendmw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpblendmw ymm16, ymm13, ymm15
vpblendmw ymm16, ymm13, [rbx]
vpblendmw ymm16, ymm13, [rbx+r11*8+256]
vpblendmw ymm16, ymm13, [rbx+r11*8-256]
vpblendmw ymm16{k5}, ymm13, ymm15
vpblendmw ymm16{k5}, ymm13, [rbx]
vpblendmw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpblendmw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpblendmw ymm16{k5}{z}, ymm13, ymm15
vpblendmw ymm16{k5}{z}, ymm13, [rbx]
vpblendmw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpblendmw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpblendmw zmm24, zmm24, zmm31
vpblendmw zmm24, zmm24, [rbx]
vpblendmw zmm24, zmm24, [rbx+r11*8+256]
vpblendmw zmm24, zmm24, [rbx+r11*8-256]
vpblendmw zmm24{k5}, zmm24, zmm31
vpblendmw zmm24{k5}, zmm24, [rbx]
vpblendmw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpblendmw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpblendmw zmm24{k5}{z}, zmm24, zmm31
vpblendmw zmm24{k5}{z}, zmm24, [rbx]
vpblendmw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpblendmw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpbroadcastb with an xmm0 or memory source.
; For each destination width (xmm2, ymm16, zmm24) the source is xmm0, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpbroadcastb xmm2, xmm0
vpbroadcastb xmm2, [rbx]
vpbroadcastb xmm2, [rbx+r11*8+256]
vpbroadcastb xmm2, [rbx+r11*8-256]
vpbroadcastb xmm2{k5}, xmm0
vpbroadcastb xmm2{k5}, [rbx]
vpbroadcastb xmm2{k5}, [rbx+r11*8+256]
vpbroadcastb xmm2{k5}, [rbx+r11*8-256]
vpbroadcastb xmm2{k5}{z}, xmm0
vpbroadcastb xmm2{k5}{z}, [rbx]
vpbroadcastb xmm2{k5}{z}, [rbx+r11*8+256]
vpbroadcastb xmm2{k5}{z}, [rbx+r11*8-256]
vpbroadcastb ymm16, xmm0
vpbroadcastb ymm16, [rbx]
vpbroadcastb ymm16, [rbx+r11*8+256]
vpbroadcastb ymm16, [rbx+r11*8-256]
vpbroadcastb ymm16{k5}, xmm0
vpbroadcastb ymm16{k5}, [rbx]
vpbroadcastb ymm16{k5}, [rbx+r11*8+256]
vpbroadcastb ymm16{k5}, [rbx+r11*8-256]
vpbroadcastb ymm16{k5}{z}, xmm0
vpbroadcastb ymm16{k5}{z}, [rbx]
vpbroadcastb ymm16{k5}{z}, [rbx+r11*8+256]
vpbroadcastb ymm16{k5}{z}, [rbx+r11*8-256]
vpbroadcastb zmm24, xmm0
vpbroadcastb zmm24, [rbx]
vpbroadcastb zmm24, [rbx+r11*8+256]
vpbroadcastb zmm24, [rbx+r11*8-256]
vpbroadcastb zmm24{k5}, xmm0
vpbroadcastb zmm24{k5}, [rbx]
vpbroadcastb zmm24{k5}, [rbx+r11*8+256]
vpbroadcastb zmm24{k5}, [rbx+r11*8-256]
vpbroadcastb zmm24{k5}{z}, xmm0
vpbroadcastb zmm24{k5}{z}, [rbx]
vpbroadcastb zmm24{k5}{z}, [rbx+r11*8+256]
vpbroadcastb zmm24{k5}{z}, [rbx+r11*8-256]
; vpbroadcastb with a general-purpose register source, spelled at four
; register sizes (cl, cx, ecx, rcx), for each destination width and each
; masking variant.
vpbroadcastb xmm2, cl
vpbroadcastb xmm2, cx
vpbroadcastb xmm2, ecx
vpbroadcastb xmm2, rcx
vpbroadcastb xmm2{k5}, cl
vpbroadcastb xmm2{k5}, cx
vpbroadcastb xmm2{k5}, ecx
vpbroadcastb xmm2{k5}, rcx
vpbroadcastb xmm2{k5}{z}, cl
vpbroadcastb xmm2{k5}{z}, cx
vpbroadcastb xmm2{k5}{z}, ecx
vpbroadcastb xmm2{k5}{z}, rcx
vpbroadcastb ymm16, cl
vpbroadcastb ymm16, cx
vpbroadcastb ymm16, ecx
vpbroadcastb ymm16, rcx
vpbroadcastb ymm16{k5}, cl
vpbroadcastb ymm16{k5}, cx
vpbroadcastb ymm16{k5}, ecx
vpbroadcastb ymm16{k5}, rcx
vpbroadcastb ymm16{k5}{z}, cl
vpbroadcastb ymm16{k5}{z}, cx
vpbroadcastb ymm16{k5}{z}, ecx
vpbroadcastb ymm16{k5}{z}, rcx
vpbroadcastb zmm24, cl
vpbroadcastb zmm24, cx
vpbroadcastb zmm24, ecx
vpbroadcastb zmm24, rcx
vpbroadcastb zmm24{k5}, cl
vpbroadcastb zmm24{k5}, cx
vpbroadcastb zmm24{k5}, ecx
vpbroadcastb zmm24{k5}, rcx
vpbroadcastb zmm24{k5}{z}, cl
vpbroadcastb zmm24{k5}{z}, cx
vpbroadcastb zmm24{k5}{z}, ecx
vpbroadcastb zmm24{k5}{z}, rcx
; vpbroadcastw with an xmm0 or memory source.
; For each destination width (xmm2, ymm16, zmm24) the source is xmm0, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256]; each set is repeated with no opmask,
; with {k5}, and with {k5}{z}.
vpbroadcastw xmm2, xmm0
vpbroadcastw xmm2, [rbx]
vpbroadcastw xmm2, [rbx+r11*8+256]
vpbroadcastw xmm2, [rbx+r11*8-256]
vpbroadcastw xmm2{k5}, xmm0
vpbroadcastw xmm2{k5}, [rbx]
vpbroadcastw xmm2{k5}, [rbx+r11*8+256]
vpbroadcastw xmm2{k5}, [rbx+r11*8-256]
vpbroadcastw xmm2{k5}{z}, xmm0
vpbroadcastw xmm2{k5}{z}, [rbx]
vpbroadcastw xmm2{k5}{z}, [rbx+r11*8+256]
vpbroadcastw xmm2{k5}{z}, [rbx+r11*8-256]
vpbroadcastw ymm16, xmm0
vpbroadcastw ymm16, [rbx]
vpbroadcastw ymm16, [rbx+r11*8+256]
vpbroadcastw ymm16, [rbx+r11*8-256]
vpbroadcastw ymm16{k5}, xmm0
vpbroadcastw ymm16{k5}, [rbx]
vpbroadcastw ymm16{k5}, [rbx+r11*8+256]
vpbroadcastw ymm16{k5}, [rbx+r11*8-256]
vpbroadcastw ymm16{k5}{z}, xmm0
vpbroadcastw ymm16{k5}{z}, [rbx]
vpbroadcastw ymm16{k5}{z}, [rbx+r11*8+256]
vpbroadcastw ymm16{k5}{z}, [rbx+r11*8-256]
vpbroadcastw zmm24, xmm0
vpbroadcastw zmm24, [rbx]
vpbroadcastw zmm24, [rbx+r11*8+256]
vpbroadcastw zmm24, [rbx+r11*8-256]
vpbroadcastw zmm24{k5}, xmm0
vpbroadcastw zmm24{k5}, [rbx]
vpbroadcastw zmm24{k5}, [rbx+r11*8+256]
vpbroadcastw zmm24{k5}, [rbx+r11*8-256]
vpbroadcastw zmm24{k5}{z}, xmm0
vpbroadcastw zmm24{k5}{z}, [rbx]
vpbroadcastw zmm24{k5}{z}, [rbx+r11*8+256]
vpbroadcastw zmm24{k5}{z}, [rbx+r11*8-256]
; vpbroadcastw with a general-purpose register source, spelled at three
; register sizes (cx, ecx, rcx), for each destination width and each
; masking variant.
vpbroadcastw xmm2, cx
vpbroadcastw xmm2, ecx
vpbroadcastw xmm2, rcx
vpbroadcastw xmm2{k5}, cx
vpbroadcastw xmm2{k5}, ecx
vpbroadcastw xmm2{k5}, rcx
vpbroadcastw xmm2{k5}{z}, cx
vpbroadcastw xmm2{k5}{z}, ecx
vpbroadcastw xmm2{k5}{z}, rcx
vpbroadcastw ymm16, cx
vpbroadcastw ymm16, ecx
vpbroadcastw ymm16, rcx
vpbroadcastw ymm16{k5}, cx
vpbroadcastw ymm16{k5}, ecx
vpbroadcastw ymm16{k5}, rcx
vpbroadcastw ymm16{k5}{z}, cx
vpbroadcastw ymm16{k5}{z}, ecx
vpbroadcastw ymm16{k5}{z}, rcx
vpbroadcastw zmm24, cx
vpbroadcastw zmm24, ecx
vpbroadcastw zmm24, rcx
vpbroadcastw zmm24{k5}, cx
vpbroadcastw zmm24{k5}, ecx
vpbroadcastw zmm24{k5}, rcx
vpbroadcastw zmm24{k5}{z}, cx
vpbroadcastw zmm24{k5}{z}, ecx
vpbroadcastw zmm24{k5}{z}, rcx
; VPCMPB decoder test cases: mask-register destination k3, immediate operand 10.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpb k3, xmm7, xmm0, 10
vpcmpb k3, xmm7, [rbx], 10
vpcmpb k3, xmm7, [rbx+r11*8+256], 10
vpcmpb k3, xmm7, [rbx+r11*8-256], 10
vpcmpb k3, ymm13, ymm15, 10
vpcmpb k3, ymm13, [rbx], 10
vpcmpb k3, ymm13, [rbx+r11*8+256], 10
vpcmpb k3, ymm13, [rbx+r11*8-256], 10
vpcmpb k3, zmm24, zmm31, 10
vpcmpb k3, zmm24, [rbx], 10
vpcmpb k3, zmm24, [rbx+r11*8+256], 10
vpcmpb k3, zmm24, [rbx+r11*8-256], 10
vpcmpb k3{k5}, xmm7, xmm0, 10
vpcmpb k3{k5}, xmm7, [rbx], 10
vpcmpb k3{k5}, xmm7, [rbx+r11*8+256], 10
vpcmpb k3{k5}, xmm7, [rbx+r11*8-256], 10
vpcmpb k3{k5}, ymm13, ymm15, 10
vpcmpb k3{k5}, ymm13, [rbx], 10
vpcmpb k3{k5}, ymm13, [rbx+r11*8+256], 10
vpcmpb k3{k5}, ymm13, [rbx+r11*8-256], 10
vpcmpb k3{k5}, zmm24, zmm31, 10
vpcmpb k3{k5}, zmm24, [rbx], 10
vpcmpb k3{k5}, zmm24, [rbx+r11*8+256], 10
vpcmpb k3{k5}, zmm24, [rbx+r11*8-256], 10
; VPCMPEQB decoder test cases with the mask-register destination k3.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpeqb k3, xmm7, xmm0
vpcmpeqb k3, xmm7, [rbx]
vpcmpeqb k3, xmm7, [rbx+r11*8+256]
vpcmpeqb k3, xmm7, [rbx+r11*8-256]
vpcmpeqb k3, ymm13, ymm15
vpcmpeqb k3, ymm13, [rbx]
vpcmpeqb k3, ymm13, [rbx+r11*8+256]
vpcmpeqb k3, ymm13, [rbx+r11*8-256]
vpcmpeqb k3, zmm24, zmm31
vpcmpeqb k3, zmm24, [rbx]
vpcmpeqb k3, zmm24, [rbx+r11*8+256]
vpcmpeqb k3, zmm24, [rbx+r11*8-256]
vpcmpeqb k3{k5}, xmm7, xmm0
vpcmpeqb k3{k5}, xmm7, [rbx]
vpcmpeqb k3{k5}, xmm7, [rbx+r11*8+256]
vpcmpeqb k3{k5}, xmm7, [rbx+r11*8-256]
vpcmpeqb k3{k5}, ymm13, ymm15
vpcmpeqb k3{k5}, ymm13, [rbx]
vpcmpeqb k3{k5}, ymm13, [rbx+r11*8+256]
vpcmpeqb k3{k5}, ymm13, [rbx+r11*8-256]
vpcmpeqb k3{k5}, zmm24, zmm31
vpcmpeqb k3{k5}, zmm24, [rbx]
vpcmpeqb k3{k5}, zmm24, [rbx+r11*8+256]
vpcmpeqb k3{k5}, zmm24, [rbx+r11*8-256]
; VPCMPEQW decoder test cases with the mask-register destination k3.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpeqw k3, xmm7, xmm0
vpcmpeqw k3, xmm7, [rbx]
vpcmpeqw k3, xmm7, [rbx+r11*8+256]
vpcmpeqw k3, xmm7, [rbx+r11*8-256]
vpcmpeqw k3, ymm13, ymm15
vpcmpeqw k3, ymm13, [rbx]
vpcmpeqw k3, ymm13, [rbx+r11*8+256]
vpcmpeqw k3, ymm13, [rbx+r11*8-256]
vpcmpeqw k3, zmm24, zmm31
vpcmpeqw k3, zmm24, [rbx]
vpcmpeqw k3, zmm24, [rbx+r11*8+256]
vpcmpeqw k3, zmm24, [rbx+r11*8-256]
vpcmpeqw k3{k5}, xmm7, xmm0
vpcmpeqw k3{k5}, xmm7, [rbx]
vpcmpeqw k3{k5}, xmm7, [rbx+r11*8+256]
vpcmpeqw k3{k5}, xmm7, [rbx+r11*8-256]
vpcmpeqw k3{k5}, ymm13, ymm15
vpcmpeqw k3{k5}, ymm13, [rbx]
vpcmpeqw k3{k5}, ymm13, [rbx+r11*8+256]
vpcmpeqw k3{k5}, ymm13, [rbx+r11*8-256]
vpcmpeqw k3{k5}, zmm24, zmm31
vpcmpeqw k3{k5}, zmm24, [rbx]
vpcmpeqw k3{k5}, zmm24, [rbx+r11*8+256]
vpcmpeqw k3{k5}, zmm24, [rbx+r11*8-256]
; VPCMPGTB decoder test cases with the mask-register destination k3.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpgtb k3, xmm7, xmm0
vpcmpgtb k3, xmm7, [rbx]
vpcmpgtb k3, xmm7, [rbx+r11*8+256]
vpcmpgtb k3, xmm7, [rbx+r11*8-256]
vpcmpgtb k3, ymm13, ymm15
vpcmpgtb k3, ymm13, [rbx]
vpcmpgtb k3, ymm13, [rbx+r11*8+256]
vpcmpgtb k3, ymm13, [rbx+r11*8-256]
vpcmpgtb k3, zmm24, zmm31
vpcmpgtb k3, zmm24, [rbx]
vpcmpgtb k3, zmm24, [rbx+r11*8+256]
vpcmpgtb k3, zmm24, [rbx+r11*8-256]
vpcmpgtb k3{k5}, xmm7, xmm0
vpcmpgtb k3{k5}, xmm7, [rbx]
vpcmpgtb k3{k5}, xmm7, [rbx+r11*8+256]
vpcmpgtb k3{k5}, xmm7, [rbx+r11*8-256]
vpcmpgtb k3{k5}, ymm13, ymm15
vpcmpgtb k3{k5}, ymm13, [rbx]
vpcmpgtb k3{k5}, ymm13, [rbx+r11*8+256]
vpcmpgtb k3{k5}, ymm13, [rbx+r11*8-256]
vpcmpgtb k3{k5}, zmm24, zmm31
vpcmpgtb k3{k5}, zmm24, [rbx]
vpcmpgtb k3{k5}, zmm24, [rbx+r11*8+256]
vpcmpgtb k3{k5}, zmm24, [rbx+r11*8-256]
; VPCMPGTW decoder test cases with the mask-register destination k3.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpgtw k3, xmm7, xmm0
vpcmpgtw k3, xmm7, [rbx]
vpcmpgtw k3, xmm7, [rbx+r11*8+256]
vpcmpgtw k3, xmm7, [rbx+r11*8-256]
vpcmpgtw k3, ymm13, ymm15
vpcmpgtw k3, ymm13, [rbx]
vpcmpgtw k3, ymm13, [rbx+r11*8+256]
vpcmpgtw k3, ymm13, [rbx+r11*8-256]
vpcmpgtw k3, zmm24, zmm31
vpcmpgtw k3, zmm24, [rbx]
vpcmpgtw k3, zmm24, [rbx+r11*8+256]
vpcmpgtw k3, zmm24, [rbx+r11*8-256]
vpcmpgtw k3{k5}, xmm7, xmm0
vpcmpgtw k3{k5}, xmm7, [rbx]
vpcmpgtw k3{k5}, xmm7, [rbx+r11*8+256]
vpcmpgtw k3{k5}, xmm7, [rbx+r11*8-256]
vpcmpgtw k3{k5}, ymm13, ymm15
vpcmpgtw k3{k5}, ymm13, [rbx]
vpcmpgtw k3{k5}, ymm13, [rbx+r11*8+256]
vpcmpgtw k3{k5}, ymm13, [rbx+r11*8-256]
vpcmpgtw k3{k5}, zmm24, zmm31
vpcmpgtw k3{k5}, zmm24, [rbx]
vpcmpgtw k3{k5}, zmm24, [rbx+r11*8+256]
vpcmpgtw k3{k5}, zmm24, [rbx+r11*8-256]
; VPCMPUB decoder test cases: mask-register destination k3, immediate operand 10.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpub k3, xmm7, xmm0, 10
vpcmpub k3, xmm7, [rbx], 10
vpcmpub k3, xmm7, [rbx+r11*8+256], 10
vpcmpub k3, xmm7, [rbx+r11*8-256], 10
vpcmpub k3, ymm13, ymm15, 10
vpcmpub k3, ymm13, [rbx], 10
vpcmpub k3, ymm13, [rbx+r11*8+256], 10
vpcmpub k3, ymm13, [rbx+r11*8-256], 10
vpcmpub k3, zmm24, zmm31, 10
vpcmpub k3, zmm24, [rbx], 10
vpcmpub k3, zmm24, [rbx+r11*8+256], 10
vpcmpub k3, zmm24, [rbx+r11*8-256], 10
vpcmpub k3{k5}, xmm7, xmm0, 10
vpcmpub k3{k5}, xmm7, [rbx], 10
vpcmpub k3{k5}, xmm7, [rbx+r11*8+256], 10
vpcmpub k3{k5}, xmm7, [rbx+r11*8-256], 10
vpcmpub k3{k5}, ymm13, ymm15, 10
vpcmpub k3{k5}, ymm13, [rbx], 10
vpcmpub k3{k5}, ymm13, [rbx+r11*8+256], 10
vpcmpub k3{k5}, ymm13, [rbx+r11*8-256], 10
vpcmpub k3{k5}, zmm24, zmm31, 10
vpcmpub k3{k5}, zmm24, [rbx], 10
vpcmpub k3{k5}, zmm24, [rbx+r11*8+256], 10
vpcmpub k3{k5}, zmm24, [rbx+r11*8-256], 10
; VPCMPUW decoder test cases: mask-register destination k3, immediate operand 10.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpuw k3, xmm7, xmm0, 10
vpcmpuw k3, xmm7, [rbx], 10
vpcmpuw k3, xmm7, [rbx+r11*8+256], 10
vpcmpuw k3, xmm7, [rbx+r11*8-256], 10
vpcmpuw k3, ymm13, ymm15, 10
vpcmpuw k3, ymm13, [rbx], 10
vpcmpuw k3, ymm13, [rbx+r11*8+256], 10
vpcmpuw k3, ymm13, [rbx+r11*8-256], 10
vpcmpuw k3, zmm24, zmm31, 10
vpcmpuw k3, zmm24, [rbx], 10
vpcmpuw k3, zmm24, [rbx+r11*8+256], 10
vpcmpuw k3, zmm24, [rbx+r11*8-256], 10
vpcmpuw k3{k5}, xmm7, xmm0, 10
vpcmpuw k3{k5}, xmm7, [rbx], 10
vpcmpuw k3{k5}, xmm7, [rbx+r11*8+256], 10
vpcmpuw k3{k5}, xmm7, [rbx+r11*8-256], 10
vpcmpuw k3{k5}, ymm13, ymm15, 10
vpcmpuw k3{k5}, ymm13, [rbx], 10
vpcmpuw k3{k5}, ymm13, [rbx+r11*8+256], 10
vpcmpuw k3{k5}, ymm13, [rbx+r11*8-256], 10
vpcmpuw k3{k5}, zmm24, zmm31, 10
vpcmpuw k3{k5}, zmm24, [rbx], 10
vpcmpuw k3{k5}, zmm24, [rbx+r11*8+256], 10
vpcmpuw k3{k5}, zmm24, [rbx+r11*8-256], 10
; VPCMPW decoder test cases: mask-register destination k3, immediate operand 10.
; The first 12 lines are unmasked, the last 12 use the {k5} write mask. Each
; set covers xmm, ymm and zmm sources with a register, [rbx],
; [rbx+r11*8+256] and [rbx+r11*8-256] as the second source.
vpcmpw k3, xmm7, xmm0, 10
vpcmpw k3, xmm7, [rbx], 10
vpcmpw k3, xmm7, [rbx+r11*8+256], 10
vpcmpw k3, xmm7, [rbx+r11*8-256], 10
vpcmpw k3, ymm13, ymm15, 10
vpcmpw k3, ymm13, [rbx], 10
vpcmpw k3, ymm13, [rbx+r11*8+256], 10
vpcmpw k3, ymm13, [rbx+r11*8-256], 10
vpcmpw k3, zmm24, zmm31, 10
vpcmpw k3, zmm24, [rbx], 10
vpcmpw k3, zmm24, [rbx+r11*8+256], 10
vpcmpw k3, zmm24, [rbx+r11*8-256], 10
vpcmpw k3{k5}, xmm7, xmm0, 10
vpcmpw k3{k5}, xmm7, [rbx], 10
vpcmpw k3{k5}, xmm7, [rbx+r11*8+256], 10
vpcmpw k3{k5}, xmm7, [rbx+r11*8-256], 10
vpcmpw k3{k5}, ymm13, ymm15, 10
vpcmpw k3{k5}, ymm13, [rbx], 10
vpcmpw k3{k5}, ymm13, [rbx+r11*8+256], 10
vpcmpw k3{k5}, ymm13, [rbx+r11*8-256], 10
vpcmpw k3{k5}, zmm24, zmm31, 10
vpcmpw k3{k5}, zmm24, [rbx], 10
vpcmpw k3{k5}, zmm24, [rbx+r11*8+256], 10
vpcmpw k3{k5}, zmm24, [rbx+r11*8-256], 10
; VPERMI2W decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpermi2w xmm2, xmm7, xmm0
vpermi2w xmm2, xmm7, [rbx]
vpermi2w xmm2, xmm7, [rbx+r11*8+256]
vpermi2w xmm2, xmm7, [rbx+r11*8-256]
vpermi2w xmm2{k5}, xmm7, xmm0
vpermi2w xmm2{k5}, xmm7, [rbx]
vpermi2w xmm2{k5}, xmm7, [rbx+r11*8+256]
vpermi2w xmm2{k5}, xmm7, [rbx+r11*8-256]
vpermi2w xmm2{k5}{z}, xmm7, xmm0
vpermi2w xmm2{k5}{z}, xmm7, [rbx]
vpermi2w xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpermi2w xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpermi2w ymm16, ymm13, ymm15
vpermi2w ymm16, ymm13, [rbx]
vpermi2w ymm16, ymm13, [rbx+r11*8+256]
vpermi2w ymm16, ymm13, [rbx+r11*8-256]
vpermi2w ymm16{k5}, ymm13, ymm15
vpermi2w ymm16{k5}, ymm13, [rbx]
vpermi2w ymm16{k5}, ymm13, [rbx+r11*8+256]
vpermi2w ymm16{k5}, ymm13, [rbx+r11*8-256]
vpermi2w ymm16{k5}{z}, ymm13, ymm15
vpermi2w ymm16{k5}{z}, ymm13, [rbx]
vpermi2w ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpermi2w ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpermi2w zmm24, zmm24, zmm31
vpermi2w zmm24, zmm24, [rbx]
vpermi2w zmm24, zmm24, [rbx+r11*8+256]
vpermi2w zmm24, zmm24, [rbx+r11*8-256]
vpermi2w zmm24{k5}, zmm24, zmm31
vpermi2w zmm24{k5}, zmm24, [rbx]
vpermi2w zmm24{k5}, zmm24, [rbx+r11*8+256]
vpermi2w zmm24{k5}, zmm24, [rbx+r11*8-256]
vpermi2w zmm24{k5}{z}, zmm24, zmm31
vpermi2w zmm24{k5}{z}, zmm24, [rbx]
vpermi2w zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpermi2w zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPERMT2W decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpermt2w xmm2, xmm7, xmm0
vpermt2w xmm2, xmm7, [rbx]
vpermt2w xmm2, xmm7, [rbx+r11*8+256]
vpermt2w xmm2, xmm7, [rbx+r11*8-256]
vpermt2w xmm2{k5}, xmm7, xmm0
vpermt2w xmm2{k5}, xmm7, [rbx]
vpermt2w xmm2{k5}, xmm7, [rbx+r11*8+256]
vpermt2w xmm2{k5}, xmm7, [rbx+r11*8-256]
vpermt2w xmm2{k5}{z}, xmm7, xmm0
vpermt2w xmm2{k5}{z}, xmm7, [rbx]
vpermt2w xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpermt2w xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpermt2w ymm16, ymm13, ymm15
vpermt2w ymm16, ymm13, [rbx]
vpermt2w ymm16, ymm13, [rbx+r11*8+256]
vpermt2w ymm16, ymm13, [rbx+r11*8-256]
vpermt2w ymm16{k5}, ymm13, ymm15
vpermt2w ymm16{k5}, ymm13, [rbx]
vpermt2w ymm16{k5}, ymm13, [rbx+r11*8+256]
vpermt2w ymm16{k5}, ymm13, [rbx+r11*8-256]
vpermt2w ymm16{k5}{z}, ymm13, ymm15
vpermt2w ymm16{k5}{z}, ymm13, [rbx]
vpermt2w ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpermt2w ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpermt2w zmm24, zmm24, zmm31
vpermt2w zmm24, zmm24, [rbx]
vpermt2w zmm24, zmm24, [rbx+r11*8+256]
vpermt2w zmm24, zmm24, [rbx+r11*8-256]
vpermt2w zmm24{k5}, zmm24, zmm31
vpermt2w zmm24{k5}, zmm24, [rbx]
vpermt2w zmm24{k5}, zmm24, [rbx+r11*8+256]
vpermt2w zmm24{k5}, zmm24, [rbx+r11*8-256]
vpermt2w zmm24{k5}{z}, zmm24, zmm31
vpermt2w zmm24{k5}{z}, zmm24, [rbx]
vpermt2w zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpermt2w zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPERMW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpermw xmm2, xmm7, xmm0
vpermw xmm2, xmm7, [rbx]
vpermw xmm2, xmm7, [rbx+r11*8+256]
vpermw xmm2, xmm7, [rbx+r11*8-256]
vpermw xmm2{k5}, xmm7, xmm0
vpermw xmm2{k5}, xmm7, [rbx]
vpermw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpermw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpermw xmm2{k5}{z}, xmm7, xmm0
vpermw xmm2{k5}{z}, xmm7, [rbx]
vpermw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpermw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpermw ymm16, ymm13, ymm15
vpermw ymm16, ymm13, [rbx]
vpermw ymm16, ymm13, [rbx+r11*8+256]
vpermw ymm16, ymm13, [rbx+r11*8-256]
vpermw ymm16{k5}, ymm13, ymm15
vpermw ymm16{k5}, ymm13, [rbx]
vpermw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpermw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpermw ymm16{k5}{z}, ymm13, ymm15
vpermw ymm16{k5}{z}, ymm13, [rbx]
vpermw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpermw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpermw zmm24, zmm24, zmm31
vpermw zmm24, zmm24, [rbx]
vpermw zmm24, zmm24, [rbx+r11*8+256]
vpermw zmm24, zmm24, [rbx+r11*8-256]
vpermw zmm24{k5}, zmm24, zmm31
vpermw zmm24{k5}, zmm24, [rbx]
vpermw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpermw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpermw zmm24{k5}{z}, zmm24, zmm31
vpermw zmm24{k5}{z}, zmm24, [rbx]
vpermw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpermw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPEXTRB decoder test cases: source xmm2, immediate operand 10.
; Destinations are the memory forms [rbx], [rbx+rsi*8+256] and
; [rbx+rsi*8-256], then the register spellings cl, cx, ecx and rcx.
vpextrb [rbx], xmm2, 10
vpextrb [rbx+rsi*8+256], xmm2, 10
vpextrb [rbx+rsi*8-256], xmm2, 10
vpextrb cl, xmm2, 10
vpextrb cx, xmm2, 10
vpextrb ecx, xmm2, 10
vpextrb rcx, xmm2, 10
; VPEXTRW decoder test cases, immediate operand 10.
; The first three lines extract from xmm0 into cx, ecx and rcx. The remaining
; lines extract from xmm2 into the memory forms [rbx], [rbx+rsi*8+256] and
; [rbx+rsi*8-256], and again into cx, ecx and rcx.
; NOTE(review): the two register-destination runs presumably exercise two
; different VPEXTRW encodings - confirm against the expected test results.
vpextrw cx, xmm0, 10
vpextrw ecx, xmm0, 10
vpextrw rcx, xmm0, 10
vpextrw [rbx], xmm2, 10
vpextrw [rbx+rsi*8+256], xmm2, 10
vpextrw [rbx+rsi*8-256], xmm2, 10
vpextrw cx, xmm2, 10
vpextrw ecx, xmm2, 10
vpextrw rcx, xmm2, 10
; VPINSRB decoder test cases: destination xmm2, first source xmm7, immediate
; operand 10. The inserted operand is [rbx], [rbx+rsi*8+256],
; [rbx+rsi*8-256], then the register spellings cl and ecx.
vpinsrb xmm2, xmm7, [rbx], 10
vpinsrb xmm2, xmm7, [rbx+rsi*8+256], 10
vpinsrb xmm2, xmm7, [rbx+rsi*8-256], 10
vpinsrb xmm2, xmm7, cl, 10
vpinsrb xmm2, xmm7, ecx, 10
; VPINSRW decoder test cases: destination xmm2, first source xmm7, immediate
; operand 10. The inserted operand is [rbx], [rbx+rsi*8+256],
; [rbx+rsi*8-256], then the register spellings cx and ecx.
vpinsrw xmm2, xmm7, [rbx], 10
vpinsrw xmm2, xmm7, [rbx+rsi*8+256], 10
vpinsrw xmm2, xmm7, [rbx+rsi*8-256], 10
vpinsrw xmm2, xmm7, cx, 10
vpinsrw xmm2, xmm7, ecx, 10
; VPMADDUBSW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaddubsw xmm2, xmm7, xmm0
vpmaddubsw xmm2, xmm7, [rbx]
vpmaddubsw xmm2, xmm7, [rbx+r11*8+256]
vpmaddubsw xmm2, xmm7, [rbx+r11*8-256]
vpmaddubsw xmm2{k5}, xmm7, xmm0
vpmaddubsw xmm2{k5}, xmm7, [rbx]
vpmaddubsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaddubsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaddubsw xmm2{k5}{z}, xmm7, xmm0
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx]
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaddubsw ymm16, ymm13, ymm15
vpmaddubsw ymm16, ymm13, [rbx]
vpmaddubsw ymm16, ymm13, [rbx+r11*8+256]
vpmaddubsw ymm16, ymm13, [rbx+r11*8-256]
vpmaddubsw ymm16{k5}, ymm13, ymm15
vpmaddubsw ymm16{k5}, ymm13, [rbx]
vpmaddubsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaddubsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaddubsw ymm16{k5}{z}, ymm13, ymm15
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx]
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaddubsw zmm24, zmm24, zmm31
vpmaddubsw zmm24, zmm24, [rbx]
vpmaddubsw zmm24, zmm24, [rbx+r11*8+256]
vpmaddubsw zmm24, zmm24, [rbx+r11*8-256]
vpmaddubsw zmm24{k5}, zmm24, zmm31
vpmaddubsw zmm24{k5}, zmm24, [rbx]
vpmaddubsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaddubsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaddubsw zmm24{k5}{z}, zmm24, zmm31
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx]
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMADDWD decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaddwd xmm2, xmm7, xmm0
vpmaddwd xmm2, xmm7, [rbx]
vpmaddwd xmm2, xmm7, [rbx+r11*8+256]
vpmaddwd xmm2, xmm7, [rbx+r11*8-256]
vpmaddwd xmm2{k5}, xmm7, xmm0
vpmaddwd xmm2{k5}, xmm7, [rbx]
vpmaddwd xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaddwd xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaddwd xmm2{k5}{z}, xmm7, xmm0
vpmaddwd xmm2{k5}{z}, xmm7, [rbx]
vpmaddwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaddwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaddwd ymm16, ymm13, ymm15
vpmaddwd ymm16, ymm13, [rbx]
vpmaddwd ymm16, ymm13, [rbx+r11*8+256]
vpmaddwd ymm16, ymm13, [rbx+r11*8-256]
vpmaddwd ymm16{k5}, ymm13, ymm15
vpmaddwd ymm16{k5}, ymm13, [rbx]
vpmaddwd ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaddwd ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaddwd ymm16{k5}{z}, ymm13, ymm15
vpmaddwd ymm16{k5}{z}, ymm13, [rbx]
vpmaddwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaddwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaddwd zmm24, zmm24, zmm31
vpmaddwd zmm24, zmm24, [rbx]
vpmaddwd zmm24, zmm24, [rbx+r11*8+256]
vpmaddwd zmm24, zmm24, [rbx+r11*8-256]
vpmaddwd zmm24{k5}, zmm24, zmm31
vpmaddwd zmm24{k5}, zmm24, [rbx]
vpmaddwd zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaddwd zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaddwd zmm24{k5}{z}, zmm24, zmm31
vpmaddwd zmm24{k5}{z}, zmm24, [rbx]
vpmaddwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaddwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMAXSB decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaxsb xmm2, xmm7, xmm0
vpmaxsb xmm2, xmm7, [rbx]
vpmaxsb xmm2, xmm7, [rbx+r11*8+256]
vpmaxsb xmm2, xmm7, [rbx+r11*8-256]
vpmaxsb xmm2{k5}, xmm7, xmm0
vpmaxsb xmm2{k5}, xmm7, [rbx]
vpmaxsb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaxsb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaxsb xmm2{k5}{z}, xmm7, xmm0
vpmaxsb xmm2{k5}{z}, xmm7, [rbx]
vpmaxsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaxsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaxsb ymm16, ymm13, ymm15
vpmaxsb ymm16, ymm13, [rbx]
vpmaxsb ymm16, ymm13, [rbx+r11*8+256]
vpmaxsb ymm16, ymm13, [rbx+r11*8-256]
vpmaxsb ymm16{k5}, ymm13, ymm15
vpmaxsb ymm16{k5}, ymm13, [rbx]
vpmaxsb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaxsb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaxsb ymm16{k5}{z}, ymm13, ymm15
vpmaxsb ymm16{k5}{z}, ymm13, [rbx]
vpmaxsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaxsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaxsb zmm24, zmm24, zmm31
vpmaxsb zmm24, zmm24, [rbx]
vpmaxsb zmm24, zmm24, [rbx+r11*8+256]
vpmaxsb zmm24, zmm24, [rbx+r11*8-256]
vpmaxsb zmm24{k5}, zmm24, zmm31
vpmaxsb zmm24{k5}, zmm24, [rbx]
vpmaxsb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaxsb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaxsb zmm24{k5}{z}, zmm24, zmm31
vpmaxsb zmm24{k5}{z}, zmm24, [rbx]
vpmaxsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaxsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMAXSW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaxsw xmm2, xmm7, xmm0
vpmaxsw xmm2, xmm7, [rbx]
vpmaxsw xmm2, xmm7, [rbx+r11*8+256]
vpmaxsw xmm2, xmm7, [rbx+r11*8-256]
vpmaxsw xmm2{k5}, xmm7, xmm0
vpmaxsw xmm2{k5}, xmm7, [rbx]
vpmaxsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaxsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaxsw xmm2{k5}{z}, xmm7, xmm0
vpmaxsw xmm2{k5}{z}, xmm7, [rbx]
vpmaxsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaxsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaxsw ymm16, ymm13, ymm15
vpmaxsw ymm16, ymm13, [rbx]
vpmaxsw ymm16, ymm13, [rbx+r11*8+256]
vpmaxsw ymm16, ymm13, [rbx+r11*8-256]
vpmaxsw ymm16{k5}, ymm13, ymm15
vpmaxsw ymm16{k5}, ymm13, [rbx]
vpmaxsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaxsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaxsw ymm16{k5}{z}, ymm13, ymm15
vpmaxsw ymm16{k5}{z}, ymm13, [rbx]
vpmaxsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaxsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaxsw zmm24, zmm24, zmm31
vpmaxsw zmm24, zmm24, [rbx]
vpmaxsw zmm24, zmm24, [rbx+r11*8+256]
vpmaxsw zmm24, zmm24, [rbx+r11*8-256]
vpmaxsw zmm24{k5}, zmm24, zmm31
vpmaxsw zmm24{k5}, zmm24, [rbx]
vpmaxsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaxsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaxsw zmm24{k5}{z}, zmm24, zmm31
vpmaxsw zmm24{k5}{z}, zmm24, [rbx]
vpmaxsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaxsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMAXUB decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaxub xmm2, xmm7, xmm0
vpmaxub xmm2, xmm7, [rbx]
vpmaxub xmm2, xmm7, [rbx+r11*8+256]
vpmaxub xmm2, xmm7, [rbx+r11*8-256]
vpmaxub xmm2{k5}, xmm7, xmm0
vpmaxub xmm2{k5}, xmm7, [rbx]
vpmaxub xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaxub xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaxub xmm2{k5}{z}, xmm7, xmm0
vpmaxub xmm2{k5}{z}, xmm7, [rbx]
vpmaxub xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaxub xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaxub ymm16, ymm13, ymm15
vpmaxub ymm16, ymm13, [rbx]
vpmaxub ymm16, ymm13, [rbx+r11*8+256]
vpmaxub ymm16, ymm13, [rbx+r11*8-256]
vpmaxub ymm16{k5}, ymm13, ymm15
vpmaxub ymm16{k5}, ymm13, [rbx]
vpmaxub ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaxub ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaxub ymm16{k5}{z}, ymm13, ymm15
vpmaxub ymm16{k5}{z}, ymm13, [rbx]
vpmaxub ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaxub ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaxub zmm24, zmm24, zmm31
vpmaxub zmm24, zmm24, [rbx]
vpmaxub zmm24, zmm24, [rbx+r11*8+256]
vpmaxub zmm24, zmm24, [rbx+r11*8-256]
vpmaxub zmm24{k5}, zmm24, zmm31
vpmaxub zmm24{k5}, zmm24, [rbx]
vpmaxub zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaxub zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaxub zmm24{k5}{z}, zmm24, zmm31
vpmaxub zmm24{k5}{z}, zmm24, [rbx]
vpmaxub zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaxub zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMAXUW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmaxuw xmm2, xmm7, xmm0
vpmaxuw xmm2, xmm7, [rbx]
vpmaxuw xmm2, xmm7, [rbx+r11*8+256]
vpmaxuw xmm2, xmm7, [rbx+r11*8-256]
vpmaxuw xmm2{k5}, xmm7, xmm0
vpmaxuw xmm2{k5}, xmm7, [rbx]
vpmaxuw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmaxuw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmaxuw xmm2{k5}{z}, xmm7, xmm0
vpmaxuw xmm2{k5}{z}, xmm7, [rbx]
vpmaxuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmaxuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmaxuw ymm16, ymm13, ymm15
vpmaxuw ymm16, ymm13, [rbx]
vpmaxuw ymm16, ymm13, [rbx+r11*8+256]
vpmaxuw ymm16, ymm13, [rbx+r11*8-256]
vpmaxuw ymm16{k5}, ymm13, ymm15
vpmaxuw ymm16{k5}, ymm13, [rbx]
vpmaxuw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmaxuw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmaxuw ymm16{k5}{z}, ymm13, ymm15
vpmaxuw ymm16{k5}{z}, ymm13, [rbx]
vpmaxuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmaxuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmaxuw zmm24, zmm24, zmm31
vpmaxuw zmm24, zmm24, [rbx]
vpmaxuw zmm24, zmm24, [rbx+r11*8+256]
vpmaxuw zmm24, zmm24, [rbx+r11*8-256]
vpmaxuw zmm24{k5}, zmm24, zmm31
vpmaxuw zmm24{k5}, zmm24, [rbx]
vpmaxuw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmaxuw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmaxuw zmm24{k5}{z}, zmm24, zmm31
vpmaxuw zmm24{k5}{z}, zmm24, [rbx]
vpmaxuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmaxuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMINSB decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpminsb xmm2, xmm7, xmm0
vpminsb xmm2, xmm7, [rbx]
vpminsb xmm2, xmm7, [rbx+r11*8+256]
vpminsb xmm2, xmm7, [rbx+r11*8-256]
vpminsb xmm2{k5}, xmm7, xmm0
vpminsb xmm2{k5}, xmm7, [rbx]
vpminsb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpminsb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpminsb xmm2{k5}{z}, xmm7, xmm0
vpminsb xmm2{k5}{z}, xmm7, [rbx]
vpminsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpminsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpminsb ymm16, ymm13, ymm15
vpminsb ymm16, ymm13, [rbx]
vpminsb ymm16, ymm13, [rbx+r11*8+256]
vpminsb ymm16, ymm13, [rbx+r11*8-256]
vpminsb ymm16{k5}, ymm13, ymm15
vpminsb ymm16{k5}, ymm13, [rbx]
vpminsb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpminsb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpminsb ymm16{k5}{z}, ymm13, ymm15
vpminsb ymm16{k5}{z}, ymm13, [rbx]
vpminsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpminsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpminsb zmm24, zmm24, zmm31
vpminsb zmm24, zmm24, [rbx]
vpminsb zmm24, zmm24, [rbx+r11*8+256]
vpminsb zmm24, zmm24, [rbx+r11*8-256]
vpminsb zmm24{k5}, zmm24, zmm31
vpminsb zmm24{k5}, zmm24, [rbx]
vpminsb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpminsb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpminsb zmm24{k5}{z}, zmm24, zmm31
vpminsb zmm24{k5}{z}, zmm24, [rbx]
vpminsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpminsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMINSW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpminsw xmm2, xmm7, xmm0
vpminsw xmm2, xmm7, [rbx]
vpminsw xmm2, xmm7, [rbx+r11*8+256]
vpminsw xmm2, xmm7, [rbx+r11*8-256]
vpminsw xmm2{k5}, xmm7, xmm0
vpminsw xmm2{k5}, xmm7, [rbx]
vpminsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpminsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpminsw xmm2{k5}{z}, xmm7, xmm0
vpminsw xmm2{k5}{z}, xmm7, [rbx]
vpminsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpminsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpminsw ymm16, ymm13, ymm15
vpminsw ymm16, ymm13, [rbx]
vpminsw ymm16, ymm13, [rbx+r11*8+256]
vpminsw ymm16, ymm13, [rbx+r11*8-256]
vpminsw ymm16{k5}, ymm13, ymm15
vpminsw ymm16{k5}, ymm13, [rbx]
vpminsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpminsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpminsw ymm16{k5}{z}, ymm13, ymm15
vpminsw ymm16{k5}{z}, ymm13, [rbx]
vpminsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpminsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpminsw zmm24, zmm24, zmm31
vpminsw zmm24, zmm24, [rbx]
vpminsw zmm24, zmm24, [rbx+r11*8+256]
vpminsw zmm24, zmm24, [rbx+r11*8-256]
vpminsw zmm24{k5}, zmm24, zmm31
vpminsw zmm24{k5}, zmm24, [rbx]
vpminsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpminsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpminsw zmm24{k5}{z}, zmm24, zmm31
vpminsw zmm24{k5}{z}, zmm24, [rbx]
vpminsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpminsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMINUB decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpminub xmm2, xmm7, xmm0
vpminub xmm2, xmm7, [rbx]
vpminub xmm2, xmm7, [rbx+r11*8+256]
vpminub xmm2, xmm7, [rbx+r11*8-256]
vpminub xmm2{k5}, xmm7, xmm0
vpminub xmm2{k5}, xmm7, [rbx]
vpminub xmm2{k5}, xmm7, [rbx+r11*8+256]
vpminub xmm2{k5}, xmm7, [rbx+r11*8-256]
vpminub xmm2{k5}{z}, xmm7, xmm0
vpminub xmm2{k5}{z}, xmm7, [rbx]
vpminub xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpminub xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpminub ymm16, ymm13, ymm15
vpminub ymm16, ymm13, [rbx]
vpminub ymm16, ymm13, [rbx+r11*8+256]
vpminub ymm16, ymm13, [rbx+r11*8-256]
vpminub ymm16{k5}, ymm13, ymm15
vpminub ymm16{k5}, ymm13, [rbx]
vpminub ymm16{k5}, ymm13, [rbx+r11*8+256]
vpminub ymm16{k5}, ymm13, [rbx+r11*8-256]
vpminub ymm16{k5}{z}, ymm13, ymm15
vpminub ymm16{k5}{z}, ymm13, [rbx]
vpminub ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpminub ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpminub zmm24, zmm24, zmm31
vpminub zmm24, zmm24, [rbx]
vpminub zmm24, zmm24, [rbx+r11*8+256]
vpminub zmm24, zmm24, [rbx+r11*8-256]
vpminub zmm24{k5}, zmm24, zmm31
vpminub zmm24{k5}, zmm24, [rbx]
vpminub zmm24{k5}, zmm24, [rbx+r11*8+256]
vpminub zmm24{k5}, zmm24, [rbx+r11*8-256]
vpminub zmm24{k5}{z}, zmm24, zmm31
vpminub zmm24{k5}{z}, zmm24, [rbx]
vpminub zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpminub zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMINUW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpminuw xmm2, xmm7, xmm0
vpminuw xmm2, xmm7, [rbx]
vpminuw xmm2, xmm7, [rbx+r11*8+256]
vpminuw xmm2, xmm7, [rbx+r11*8-256]
vpminuw xmm2{k5}, xmm7, xmm0
vpminuw xmm2{k5}, xmm7, [rbx]
vpminuw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpminuw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpminuw xmm2{k5}{z}, xmm7, xmm0
vpminuw xmm2{k5}{z}, xmm7, [rbx]
vpminuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpminuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpminuw ymm16, ymm13, ymm15
vpminuw ymm16, ymm13, [rbx]
vpminuw ymm16, ymm13, [rbx+r11*8+256]
vpminuw ymm16, ymm13, [rbx+r11*8-256]
vpminuw ymm16{k5}, ymm13, ymm15
vpminuw ymm16{k5}, ymm13, [rbx]
vpminuw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpminuw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpminuw ymm16{k5}{z}, ymm13, ymm15
vpminuw ymm16{k5}{z}, ymm13, [rbx]
vpminuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpminuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpminuw zmm24, zmm24, zmm31
vpminuw zmm24, zmm24, [rbx]
vpminuw zmm24, zmm24, [rbx+r11*8+256]
vpminuw zmm24, zmm24, [rbx+r11*8-256]
vpminuw zmm24{k5}, zmm24, zmm31
vpminuw zmm24{k5}, zmm24, [rbx]
vpminuw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpminuw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpminuw zmm24{k5}{z}, zmm24, zmm31
vpminuw zmm24{k5}{z}, zmm24, [rbx]
vpminuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpminuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMOVB2M decoder test cases: mask-register destination k3 with an xmm, ymm
; and zmm source register.
vpmovb2m k3, xmm0
vpmovb2m k3, ymm15
vpmovb2m k3, zmm31
; VPMOVM2B decoder test cases: mask-register source k1 with an xmm, ymm and
; zmm destination register.
vpmovm2b xmm2, k1
vpmovm2b ymm16, k1
vpmovm2b zmm24, k1
; VPMOVM2W decoder test cases: mask-register source k1 with an xmm, ymm and
; zmm destination register.
vpmovm2w xmm2, k1
vpmovm2w ymm16, k1
vpmovm2w zmm24, k1
; VPMOVSWB decoder test cases; only unmasked forms are listed here.
; Register destinations come first (xmm0 from xmm2, xmm0 from ymm16, ymm15
; from zmm24), followed by the memory destinations [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256], each with the xmm2, ymm16 and zmm24 sources.
vpmovswb xmm0, xmm2
vpmovswb xmm0, ymm16
vpmovswb ymm15, zmm24
vpmovswb [rbx], xmm2
vpmovswb [rbx], ymm16
vpmovswb [rbx], zmm24
vpmovswb [rbx+r11*8+256], xmm2
vpmovswb [rbx+r11*8+256], ymm16
vpmovswb [rbx+r11*8+256], zmm24
vpmovswb [rbx+r11*8-256], xmm2
vpmovswb [rbx+r11*8-256], ymm16
vpmovswb [rbx+r11*8-256], zmm24
; VPMOVSXBW decoder test cases for xmm2, ymm16 and zmm24 destinations.
; Each destination is listed unmasked, with the {k5} write mask, and with
; {k5}{z}. The register source is xmm0 for the xmm2 and ymm16 destinations and
; ymm15 for zmm24; memory sources are [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256].
vpmovsxbw xmm2, xmm0
vpmovsxbw xmm2, [rbx]
vpmovsxbw xmm2, [rbx+r11*8+256]
vpmovsxbw xmm2, [rbx+r11*8-256]
vpmovsxbw xmm2{k5}, xmm0
vpmovsxbw xmm2{k5}, [rbx]
vpmovsxbw xmm2{k5}, [rbx+r11*8+256]
vpmovsxbw xmm2{k5}, [rbx+r11*8-256]
vpmovsxbw xmm2{k5}{z}, xmm0
vpmovsxbw xmm2{k5}{z}, [rbx]
vpmovsxbw xmm2{k5}{z}, [rbx+r11*8+256]
vpmovsxbw xmm2{k5}{z}, [rbx+r11*8-256]
vpmovsxbw ymm16, xmm0
vpmovsxbw ymm16, [rbx]
vpmovsxbw ymm16, [rbx+r11*8+256]
vpmovsxbw ymm16, [rbx+r11*8-256]
vpmovsxbw ymm16{k5}, xmm0
vpmovsxbw ymm16{k5}, [rbx]
vpmovsxbw ymm16{k5}, [rbx+r11*8+256]
vpmovsxbw ymm16{k5}, [rbx+r11*8-256]
vpmovsxbw ymm16{k5}{z}, xmm0
vpmovsxbw ymm16{k5}{z}, [rbx]
vpmovsxbw ymm16{k5}{z}, [rbx+r11*8+256]
vpmovsxbw ymm16{k5}{z}, [rbx+r11*8-256]
vpmovsxbw zmm24, ymm15
vpmovsxbw zmm24, [rbx]
vpmovsxbw zmm24, [rbx+r11*8+256]
vpmovsxbw zmm24, [rbx+r11*8-256]
vpmovsxbw zmm24{k5}, ymm15
vpmovsxbw zmm24{k5}, [rbx]
vpmovsxbw zmm24{k5}, [rbx+r11*8+256]
vpmovsxbw zmm24{k5}, [rbx+r11*8-256]
vpmovsxbw zmm24{k5}{z}, ymm15
vpmovsxbw zmm24{k5}{z}, [rbx]
vpmovsxbw zmm24{k5}{z}, [rbx+r11*8+256]
vpmovsxbw zmm24{k5}{z}, [rbx+r11*8-256]
; VPMOVUSWB decoder test cases; only unmasked forms are listed here.
; Register destinations come first (xmm0 from xmm2, xmm0 from ymm16, ymm15
; from zmm24), followed by the memory destinations [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256], each with the xmm2, ymm16 and zmm24 sources.
vpmovuswb xmm0, xmm2
vpmovuswb xmm0, ymm16
vpmovuswb ymm15, zmm24
vpmovuswb [rbx], xmm2
vpmovuswb [rbx], ymm16
vpmovuswb [rbx], zmm24
vpmovuswb [rbx+r11*8+256], xmm2
vpmovuswb [rbx+r11*8+256], ymm16
vpmovuswb [rbx+r11*8+256], zmm24
vpmovuswb [rbx+r11*8-256], xmm2
vpmovuswb [rbx+r11*8-256], ymm16
vpmovuswb [rbx+r11*8-256], zmm24
; VPMOVW2M decoder test cases: mask-register destination k3 with an xmm, ymm
; and zmm source register.
vpmovw2m k3, xmm0
vpmovw2m k3, ymm15
vpmovw2m k3, zmm31
; VPMOVWB decoder test cases; only unmasked forms are listed here.
; Register destinations come first (xmm0 from xmm2, xmm0 from ymm16, ymm15
; from zmm24), followed by the memory destinations [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256], each with the xmm2, ymm16 and zmm24 sources.
vpmovwb xmm0, xmm2
vpmovwb xmm0, ymm16
vpmovwb ymm15, zmm24
vpmovwb [rbx], xmm2
vpmovwb [rbx], ymm16
vpmovwb [rbx], zmm24
vpmovwb [rbx+r11*8+256], xmm2
vpmovwb [rbx+r11*8+256], ymm16
vpmovwb [rbx+r11*8+256], zmm24
vpmovwb [rbx+r11*8-256], xmm2
vpmovwb [rbx+r11*8-256], ymm16
vpmovwb [rbx+r11*8-256], zmm24
; VPMOVZXBW decoder test cases for xmm2, ymm16 and zmm24 destinations.
; Each destination is listed unmasked, with the {k5} write mask, and with
; {k5}{z}. The register source is xmm0 for the xmm2 and ymm16 destinations and
; ymm15 for zmm24; memory sources are [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256].
vpmovzxbw xmm2, xmm0
vpmovzxbw xmm2, [rbx]
vpmovzxbw xmm2, [rbx+r11*8+256]
vpmovzxbw xmm2, [rbx+r11*8-256]
vpmovzxbw xmm2{k5}, xmm0
vpmovzxbw xmm2{k5}, [rbx]
vpmovzxbw xmm2{k5}, [rbx+r11*8+256]
vpmovzxbw xmm2{k5}, [rbx+r11*8-256]
vpmovzxbw xmm2{k5}{z}, xmm0
vpmovzxbw xmm2{k5}{z}, [rbx]
vpmovzxbw xmm2{k5}{z}, [rbx+r11*8+256]
vpmovzxbw xmm2{k5}{z}, [rbx+r11*8-256]
vpmovzxbw ymm16, xmm0
vpmovzxbw ymm16, [rbx]
vpmovzxbw ymm16, [rbx+r11*8+256]
vpmovzxbw ymm16, [rbx+r11*8-256]
vpmovzxbw ymm16{k5}, xmm0
vpmovzxbw ymm16{k5}, [rbx]
vpmovzxbw ymm16{k5}, [rbx+r11*8+256]
vpmovzxbw ymm16{k5}, [rbx+r11*8-256]
vpmovzxbw ymm16{k5}{z}, xmm0
vpmovzxbw ymm16{k5}{z}, [rbx]
vpmovzxbw ymm16{k5}{z}, [rbx+r11*8+256]
vpmovzxbw ymm16{k5}{z}, [rbx+r11*8-256]
vpmovzxbw zmm24, ymm15
vpmovzxbw zmm24, [rbx]
vpmovzxbw zmm24, [rbx+r11*8+256]
vpmovzxbw zmm24, [rbx+r11*8-256]
vpmovzxbw zmm24{k5}, ymm15
vpmovzxbw zmm24{k5}, [rbx]
vpmovzxbw zmm24{k5}, [rbx+r11*8+256]
vpmovzxbw zmm24{k5}, [rbx+r11*8-256]
vpmovzxbw zmm24{k5}{z}, ymm15
vpmovzxbw zmm24{k5}{z}, [rbx]
vpmovzxbw zmm24{k5}{z}, [rbx+r11*8+256]
vpmovzxbw zmm24{k5}{z}, [rbx+r11*8-256]
; VPMULHRSW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmulhrsw xmm2, xmm7, xmm0
vpmulhrsw xmm2, xmm7, [rbx]
vpmulhrsw xmm2, xmm7, [rbx+r11*8+256]
vpmulhrsw xmm2, xmm7, [rbx+r11*8-256]
vpmulhrsw xmm2{k5}, xmm7, xmm0
vpmulhrsw xmm2{k5}, xmm7, [rbx]
vpmulhrsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmulhrsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmulhrsw xmm2{k5}{z}, xmm7, xmm0
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx]
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmulhrsw ymm16, ymm13, ymm15
vpmulhrsw ymm16, ymm13, [rbx]
vpmulhrsw ymm16, ymm13, [rbx+r11*8+256]
vpmulhrsw ymm16, ymm13, [rbx+r11*8-256]
vpmulhrsw ymm16{k5}, ymm13, ymm15
vpmulhrsw ymm16{k5}, ymm13, [rbx]
vpmulhrsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmulhrsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmulhrsw ymm16{k5}{z}, ymm13, ymm15
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx]
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmulhrsw zmm24, zmm24, zmm31
vpmulhrsw zmm24, zmm24, [rbx]
vpmulhrsw zmm24, zmm24, [rbx+r11*8+256]
vpmulhrsw zmm24, zmm24, [rbx+r11*8-256]
vpmulhrsw zmm24{k5}, zmm24, zmm31
vpmulhrsw zmm24{k5}, zmm24, [rbx]
vpmulhrsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmulhrsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmulhrsw zmm24{k5}{z}, zmm24, zmm31
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx]
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMULHUW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmulhuw xmm2, xmm7, xmm0
vpmulhuw xmm2, xmm7, [rbx]
vpmulhuw xmm2, xmm7, [rbx+r11*8+256]
vpmulhuw xmm2, xmm7, [rbx+r11*8-256]
vpmulhuw xmm2{k5}, xmm7, xmm0
vpmulhuw xmm2{k5}, xmm7, [rbx]
vpmulhuw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmulhuw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmulhuw xmm2{k5}{z}, xmm7, xmm0
vpmulhuw xmm2{k5}{z}, xmm7, [rbx]
vpmulhuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmulhuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmulhuw ymm16, ymm13, ymm15
vpmulhuw ymm16, ymm13, [rbx]
vpmulhuw ymm16, ymm13, [rbx+r11*8+256]
vpmulhuw ymm16, ymm13, [rbx+r11*8-256]
vpmulhuw ymm16{k5}, ymm13, ymm15
vpmulhuw ymm16{k5}, ymm13, [rbx]
vpmulhuw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmulhuw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmulhuw ymm16{k5}{z}, ymm13, ymm15
vpmulhuw ymm16{k5}{z}, ymm13, [rbx]
vpmulhuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmulhuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmulhuw zmm24, zmm24, zmm31
vpmulhuw zmm24, zmm24, [rbx]
vpmulhuw zmm24, zmm24, [rbx+r11*8+256]
vpmulhuw zmm24, zmm24, [rbx+r11*8-256]
vpmulhuw zmm24{k5}, zmm24, zmm31
vpmulhuw zmm24{k5}, zmm24, [rbx]
vpmulhuw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmulhuw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmulhuw zmm24{k5}{z}, zmm24, zmm31
vpmulhuw zmm24{k5}{z}, zmm24, [rbx]
vpmulhuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmulhuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; VPMULHW decoder test cases for xmm, ymm and zmm operands.
; Each operand size is listed unmasked, with the {k5} write mask, and with
; {k5}{z}; the last operand is a register, [rbx], [rbx+r11*8+256] and
; [rbx+r11*8-256] in turn.
vpmulhw xmm2, xmm7, xmm0
vpmulhw xmm2, xmm7, [rbx]
vpmulhw xmm2, xmm7, [rbx+r11*8+256]
vpmulhw xmm2, xmm7, [rbx+r11*8-256]
vpmulhw xmm2{k5}, xmm7, xmm0
vpmulhw xmm2{k5}, xmm7, [rbx]
vpmulhw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmulhw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmulhw xmm2{k5}{z}, xmm7, xmm0
vpmulhw xmm2{k5}{z}, xmm7, [rbx]
vpmulhw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmulhw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmulhw ymm16, ymm13, ymm15
vpmulhw ymm16, ymm13, [rbx]
vpmulhw ymm16, ymm13, [rbx+r11*8+256]
vpmulhw ymm16, ymm13, [rbx+r11*8-256]
vpmulhw ymm16{k5}, ymm13, ymm15
vpmulhw ymm16{k5}, ymm13, [rbx]
vpmulhw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmulhw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmulhw ymm16{k5}{z}, ymm13, ymm15
vpmulhw ymm16{k5}{z}, ymm13, [rbx]
vpmulhw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmulhw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmulhw zmm24, zmm24, zmm31
vpmulhw zmm24, zmm24, [rbx]
vpmulhw zmm24, zmm24, [rbx+r11*8+256]
vpmulhw zmm24, zmm24, [rbx+r11*8-256]
vpmulhw zmm24{k5}, zmm24, zmm31
vpmulhw zmm24{k5}, zmm24, [rbx]
vpmulhw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmulhw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmulhw zmm24{k5}{z}, zmm24, zmm31
vpmulhw zmm24{k5}{z}, zmm24, [rbx]
vpmulhw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmulhw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpmullw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpmullw xmm2, xmm7, xmm0
vpmullw xmm2, xmm7, [rbx]
vpmullw xmm2, xmm7, [rbx+r11*8+256]
vpmullw xmm2, xmm7, [rbx+r11*8-256]
vpmullw xmm2{k5}, xmm7, xmm0
vpmullw xmm2{k5}, xmm7, [rbx]
vpmullw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpmullw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpmullw xmm2{k5}{z}, xmm7, xmm0
vpmullw xmm2{k5}{z}, xmm7, [rbx]
vpmullw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpmullw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpmullw ymm16, ymm13, ymm15
vpmullw ymm16, ymm13, [rbx]
vpmullw ymm16, ymm13, [rbx+r11*8+256]
vpmullw ymm16, ymm13, [rbx+r11*8-256]
vpmullw ymm16{k5}, ymm13, ymm15
vpmullw ymm16{k5}, ymm13, [rbx]
vpmullw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpmullw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpmullw ymm16{k5}{z}, ymm13, ymm15
vpmullw ymm16{k5}{z}, ymm13, [rbx]
vpmullw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpmullw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpmullw zmm24, zmm24, zmm31
vpmullw zmm24, zmm24, [rbx]
vpmullw zmm24, zmm24, [rbx+r11*8+256]
vpmullw zmm24, zmm24, [rbx+r11*8-256]
vpmullw zmm24{k5}, zmm24, zmm31
vpmullw zmm24{k5}, zmm24, [rbx]
vpmullw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpmullw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpmullw zmm24{k5}{z}, zmm24, zmm31
vpmullw zmm24{k5}{z}, zmm24, [rbx]
vpmullw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpmullw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsadbw test vectors: xmm2, ymm16 and zmm24 destinations, each with a
; register source, [rbx], and an indexed address with +256 / -256 displacement.
; Only unmasked variants are listed for this mnemonic.
vpsadbw xmm2, xmm7, xmm0
vpsadbw xmm2, xmm7, [rbx]
vpsadbw xmm2, xmm7, [rbx+r11*8+256]
vpsadbw xmm2, xmm7, [rbx+r11*8-256]
vpsadbw ymm16, ymm13, ymm15
vpsadbw ymm16, ymm13, [rbx]
vpsadbw ymm16, ymm13, [rbx+r11*8+256]
vpsadbw ymm16, ymm13, [rbx+r11*8-256]
vpsadbw zmm24, zmm24, zmm31
vpsadbw zmm24, zmm24, [rbx]
vpsadbw zmm24, zmm24, [rbx+r11*8+256]
vpsadbw zmm24, zmm24, [rbx+r11*8-256]
; vpshufb test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpshufb xmm2, xmm7, xmm0
vpshufb xmm2, xmm7, [rbx]
vpshufb xmm2, xmm7, [rbx+r11*8+256]
vpshufb xmm2, xmm7, [rbx+r11*8-256]
vpshufb xmm2{k5}, xmm7, xmm0
vpshufb xmm2{k5}, xmm7, [rbx]
vpshufb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpshufb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpshufb xmm2{k5}{z}, xmm7, xmm0
vpshufb xmm2{k5}{z}, xmm7, [rbx]
vpshufb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpshufb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpshufb ymm16, ymm13, ymm15
vpshufb ymm16, ymm13, [rbx]
vpshufb ymm16, ymm13, [rbx+r11*8+256]
vpshufb ymm16, ymm13, [rbx+r11*8-256]
vpshufb ymm16{k5}, ymm13, ymm15
vpshufb ymm16{k5}, ymm13, [rbx]
vpshufb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpshufb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpshufb ymm16{k5}{z}, ymm13, ymm15
vpshufb ymm16{k5}{z}, ymm13, [rbx]
vpshufb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpshufb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpshufb zmm24, zmm24, zmm31
vpshufb zmm24, zmm24, [rbx]
vpshufb zmm24, zmm24, [rbx+r11*8+256]
vpshufb zmm24, zmm24, [rbx+r11*8-256]
vpshufb zmm24{k5}, zmm24, zmm31
vpshufb zmm24{k5}, zmm24, [rbx]
vpshufb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpshufb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpshufb zmm24{k5}{z}, zmm24, zmm31
vpshufb zmm24{k5}{z}, zmm24, [rbx]
vpshufb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpshufb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpshufhw test vectors: destination, one source (register or memory) and an
; immediate operand of 10. xmm2, ymm16 and zmm24 destinations each appear
; unmasked, with the {k5} mask, and with {k5}{z}; memory sources are [rbx]
; and an indexed address with +256 / -256 displacement.
vpshufhw xmm2, xmm0, 10
vpshufhw xmm2, [rbx], 10
vpshufhw xmm2, [rbx+r11*8+256], 10
vpshufhw xmm2, [rbx+r11*8-256], 10
vpshufhw xmm2{k5}, xmm0, 10
vpshufhw xmm2{k5}, [rbx], 10
vpshufhw xmm2{k5}, [rbx+r11*8+256], 10
vpshufhw xmm2{k5}, [rbx+r11*8-256], 10
vpshufhw xmm2{k5}{z}, xmm0, 10
vpshufhw xmm2{k5}{z}, [rbx], 10
vpshufhw xmm2{k5}{z}, [rbx+r11*8+256], 10
vpshufhw xmm2{k5}{z}, [rbx+r11*8-256], 10
vpshufhw ymm16, ymm15, 10
vpshufhw ymm16, [rbx], 10
vpshufhw ymm16, [rbx+r11*8+256], 10
vpshufhw ymm16, [rbx+r11*8-256], 10
vpshufhw ymm16{k5}, ymm15, 10
vpshufhw ymm16{k5}, [rbx], 10
vpshufhw ymm16{k5}, [rbx+r11*8+256], 10
vpshufhw ymm16{k5}, [rbx+r11*8-256], 10
vpshufhw ymm16{k5}{z}, ymm15, 10
vpshufhw ymm16{k5}{z}, [rbx], 10
vpshufhw ymm16{k5}{z}, [rbx+r11*8+256], 10
vpshufhw ymm16{k5}{z}, [rbx+r11*8-256], 10
vpshufhw zmm24, zmm31, 10
vpshufhw zmm24, [rbx], 10
vpshufhw zmm24, [rbx+r11*8+256], 10
vpshufhw zmm24, [rbx+r11*8-256], 10
vpshufhw zmm24{k5}, zmm31, 10
vpshufhw zmm24{k5}, [rbx], 10
vpshufhw zmm24{k5}, [rbx+r11*8+256], 10
vpshufhw zmm24{k5}, [rbx+r11*8-256], 10
vpshufhw zmm24{k5}{z}, zmm31, 10
vpshufhw zmm24{k5}{z}, [rbx], 10
vpshufhw zmm24{k5}{z}, [rbx+r11*8+256], 10
vpshufhw zmm24{k5}{z}, [rbx+r11*8-256], 10
; vpshuflw test vectors: destination, one source (register or memory) and an
; immediate operand of 10. xmm2, ymm16 and zmm24 destinations each appear
; unmasked, with the {k5} mask, and with {k5}{z}; memory sources are [rbx]
; and an indexed address with +256 / -256 displacement.
vpshuflw xmm2, xmm0, 10
vpshuflw xmm2, [rbx], 10
vpshuflw xmm2, [rbx+r11*8+256], 10
vpshuflw xmm2, [rbx+r11*8-256], 10
vpshuflw xmm2{k5}, xmm0, 10
vpshuflw xmm2{k5}, [rbx], 10
vpshuflw xmm2{k5}, [rbx+r11*8+256], 10
vpshuflw xmm2{k5}, [rbx+r11*8-256], 10
vpshuflw xmm2{k5}{z}, xmm0, 10
vpshuflw xmm2{k5}{z}, [rbx], 10
vpshuflw xmm2{k5}{z}, [rbx+r11*8+256], 10
vpshuflw xmm2{k5}{z}, [rbx+r11*8-256], 10
vpshuflw ymm16, ymm15, 10
vpshuflw ymm16, [rbx], 10
vpshuflw ymm16, [rbx+r11*8+256], 10
vpshuflw ymm16, [rbx+r11*8-256], 10
vpshuflw ymm16{k5}, ymm15, 10
vpshuflw ymm16{k5}, [rbx], 10
vpshuflw ymm16{k5}, [rbx+r11*8+256], 10
vpshuflw ymm16{k5}, [rbx+r11*8-256], 10
vpshuflw ymm16{k5}{z}, ymm15, 10
vpshuflw ymm16{k5}{z}, [rbx], 10
vpshuflw ymm16{k5}{z}, [rbx+r11*8+256], 10
vpshuflw ymm16{k5}{z}, [rbx+r11*8-256], 10
vpshuflw zmm24, zmm31, 10
vpshuflw zmm24, [rbx], 10
vpshuflw zmm24, [rbx+r11*8+256], 10
vpshuflw zmm24, [rbx+r11*8-256], 10
vpshuflw zmm24{k5}, zmm31, 10
vpshuflw zmm24{k5}, [rbx], 10
vpshuflw zmm24{k5}, [rbx+r11*8+256], 10
vpshuflw zmm24{k5}, [rbx+r11*8-256], 10
vpshuflw zmm24{k5}{z}, zmm31, 10
vpshuflw zmm24{k5}{z}, [rbx], 10
vpshuflw zmm24{k5}{z}, [rbx+r11*8+256], 10
vpshuflw zmm24{k5}{z}, [rbx+r11*8-256], 10
; vpslldq test vectors: destination, one source (register or memory) and an
; immediate operand of 10, for xmm7, ymm13 and zmm24 destinations.
; Only unmasked variants are listed for this mnemonic.
vpslldq xmm7, xmm0, 10
vpslldq xmm7, [rbx], 10
vpslldq xmm7, [rbx+r11*8+256], 10
vpslldq xmm7, [rbx+r11*8-256], 10
vpslldq ymm13, ymm15, 10
vpslldq ymm13, [rbx], 10
vpslldq ymm13, [rbx+r11*8+256], 10
vpslldq ymm13, [rbx+r11*8-256], 10
vpslldq zmm24, zmm31, 10
vpslldq zmm24, [rbx], 10
vpslldq zmm24, [rbx+r11*8+256], 10
vpslldq zmm24, [rbx+r11*8-256], 10
; vpsllvw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; the last operand is a full-width vector register, [rbx], or an indexed
; address using a +256 and a -256 displacement.
vpsllvw xmm2, xmm7, xmm0
vpsllvw xmm2, xmm7, [rbx]
vpsllvw xmm2, xmm7, [rbx+r11*8+256]
vpsllvw xmm2, xmm7, [rbx+r11*8-256]
vpsllvw xmm2{k5}, xmm7, xmm0
vpsllvw xmm2{k5}, xmm7, [rbx]
vpsllvw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsllvw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsllvw xmm2{k5}{z}, xmm7, xmm0
vpsllvw xmm2{k5}{z}, xmm7, [rbx]
vpsllvw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsllvw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsllvw ymm16, ymm13, ymm15
vpsllvw ymm16, ymm13, [rbx]
vpsllvw ymm16, ymm13, [rbx+r11*8+256]
vpsllvw ymm16, ymm13, [rbx+r11*8-256]
vpsllvw ymm16{k5}, ymm13, ymm15
vpsllvw ymm16{k5}, ymm13, [rbx]
vpsllvw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsllvw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsllvw ymm16{k5}{z}, ymm13, ymm15
vpsllvw ymm16{k5}{z}, ymm13, [rbx]
vpsllvw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsllvw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsllvw zmm24, zmm24, zmm31
vpsllvw zmm24, zmm24, [rbx]
vpsllvw zmm24, zmm24, [rbx+r11*8+256]
vpsllvw zmm24, zmm24, [rbx+r11*8-256]
vpsllvw zmm24{k5}, zmm24, zmm31
vpsllvw zmm24{k5}, zmm24, [rbx]
vpsllvw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsllvw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsllvw zmm24{k5}{z}, zmm24, zmm31
vpsllvw zmm24{k5}{z}, zmm24, [rbx]
vpsllvw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsllvw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsllw, immediate form: destination, source (register or memory), and an
; immediate operand of 10. Only unmasked xmm7/ymm13/zmm24 destinations are
; listed for this form.
vpsllw xmm7, xmm0, 10
vpsllw xmm7, [rbx], 10
vpsllw xmm7, [rbx+r11*8+256], 10
vpsllw xmm7, [rbx+r11*8-256], 10
vpsllw ymm13, ymm15, 10
vpsllw ymm13, [rbx], 10
vpsllw ymm13, [rbx+r11*8+256], 10
vpsllw ymm13, [rbx+r11*8-256], 10
vpsllw zmm24, zmm31, 10
vpsllw zmm24, [rbx], 10
vpsllw zmm24, [rbx+r11*8+256], 10
vpsllw zmm24, [rbx+r11*8-256], 10
; vpsllw, three-operand form: xmm2, ymm16 and zmm24 destinations, each
; unmasked, with the {k5} mask, and with {k5}{z}.
; Note that the register variant of the last operand is xmm0 at every vector
; length, including the ymm16 and zmm24 destinations.
vpsllw xmm2, xmm7, xmm0
vpsllw xmm2, xmm7, [rbx]
vpsllw xmm2, xmm7, [rbx+r11*8+256]
vpsllw xmm2, xmm7, [rbx+r11*8-256]
vpsllw xmm2{k5}, xmm7, xmm0
vpsllw xmm2{k5}, xmm7, [rbx]
vpsllw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsllw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsllw xmm2{k5}{z}, xmm7, xmm0
vpsllw xmm2{k5}{z}, xmm7, [rbx]
vpsllw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsllw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsllw ymm16, ymm13, xmm0
vpsllw ymm16, ymm13, [rbx]
vpsllw ymm16, ymm13, [rbx+r11*8+256]
vpsllw ymm16, ymm13, [rbx+r11*8-256]
vpsllw ymm16{k5}, ymm13, xmm0
vpsllw ymm16{k5}, ymm13, [rbx]
vpsllw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsllw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsllw ymm16{k5}{z}, ymm13, xmm0
vpsllw ymm16{k5}{z}, ymm13, [rbx]
vpsllw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsllw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsllw zmm24, zmm24, xmm0
vpsllw zmm24, zmm24, [rbx]
vpsllw zmm24, zmm24, [rbx+r11*8+256]
vpsllw zmm24, zmm24, [rbx+r11*8-256]
vpsllw zmm24{k5}, zmm24, xmm0
vpsllw zmm24{k5}, zmm24, [rbx]
vpsllw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsllw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsllw zmm24{k5}{z}, zmm24, xmm0
vpsllw zmm24{k5}{z}, zmm24, [rbx]
vpsllw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsllw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsravw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; the last operand is a full-width vector register, [rbx], or an indexed
; address using a +256 and a -256 displacement.
vpsravw xmm2, xmm7, xmm0
vpsravw xmm2, xmm7, [rbx]
vpsravw xmm2, xmm7, [rbx+r11*8+256]
vpsravw xmm2, xmm7, [rbx+r11*8-256]
vpsravw xmm2{k5}, xmm7, xmm0
vpsravw xmm2{k5}, xmm7, [rbx]
vpsravw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsravw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsravw xmm2{k5}{z}, xmm7, xmm0
vpsravw xmm2{k5}{z}, xmm7, [rbx]
vpsravw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsravw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsravw ymm16, ymm13, ymm15
vpsravw ymm16, ymm13, [rbx]
vpsravw ymm16, ymm13, [rbx+r11*8+256]
vpsravw ymm16, ymm13, [rbx+r11*8-256]
vpsravw ymm16{k5}, ymm13, ymm15
vpsravw ymm16{k5}, ymm13, [rbx]
vpsravw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsravw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsravw ymm16{k5}{z}, ymm13, ymm15
vpsravw ymm16{k5}{z}, ymm13, [rbx]
vpsravw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsravw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsravw zmm24, zmm24, zmm31
vpsravw zmm24, zmm24, [rbx]
vpsravw zmm24, zmm24, [rbx+r11*8+256]
vpsravw zmm24, zmm24, [rbx+r11*8-256]
vpsravw zmm24{k5}, zmm24, zmm31
vpsravw zmm24{k5}, zmm24, [rbx]
vpsravw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsravw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsravw zmm24{k5}{z}, zmm24, zmm31
vpsravw zmm24{k5}{z}, zmm24, [rbx]
vpsravw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsravw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsraw, immediate form: destination, source (register or memory), and an
; immediate operand of 10. Only unmasked xmm7/ymm13/zmm24 destinations are
; listed for this form.
vpsraw xmm7, xmm0, 10
vpsraw xmm7, [rbx], 10
vpsraw xmm7, [rbx+r11*8+256], 10
vpsraw xmm7, [rbx+r11*8-256], 10
vpsraw ymm13, ymm15, 10
vpsraw ymm13, [rbx], 10
vpsraw ymm13, [rbx+r11*8+256], 10
vpsraw ymm13, [rbx+r11*8-256], 10
vpsraw zmm24, zmm31, 10
vpsraw zmm24, [rbx], 10
vpsraw zmm24, [rbx+r11*8+256], 10
vpsraw zmm24, [rbx+r11*8-256], 10
; vpsraw, three-operand form: xmm2, ymm16 and zmm24 destinations, each
; unmasked, with the {k5} mask, and with {k5}{z}.
; Note that the register variant of the last operand is xmm0 at every vector
; length, including the ymm16 and zmm24 destinations.
vpsraw xmm2, xmm7, xmm0
vpsraw xmm2, xmm7, [rbx]
vpsraw xmm2, xmm7, [rbx+r11*8+256]
vpsraw xmm2, xmm7, [rbx+r11*8-256]
vpsraw xmm2{k5}, xmm7, xmm0
vpsraw xmm2{k5}, xmm7, [rbx]
vpsraw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsraw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsraw xmm2{k5}{z}, xmm7, xmm0
vpsraw xmm2{k5}{z}, xmm7, [rbx]
vpsraw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsraw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsraw ymm16, ymm13, xmm0
vpsraw ymm16, ymm13, [rbx]
vpsraw ymm16, ymm13, [rbx+r11*8+256]
vpsraw ymm16, ymm13, [rbx+r11*8-256]
vpsraw ymm16{k5}, ymm13, xmm0
vpsraw ymm16{k5}, ymm13, [rbx]
vpsraw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsraw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsraw ymm16{k5}{z}, ymm13, xmm0
vpsraw ymm16{k5}{z}, ymm13, [rbx]
vpsraw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsraw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsraw zmm24, zmm24, xmm0
vpsraw zmm24, zmm24, [rbx]
vpsraw zmm24, zmm24, [rbx+r11*8+256]
vpsraw zmm24, zmm24, [rbx+r11*8-256]
vpsraw zmm24{k5}, zmm24, xmm0
vpsraw zmm24{k5}, zmm24, [rbx]
vpsraw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsraw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsraw zmm24{k5}{z}, zmm24, xmm0
vpsraw zmm24{k5}{z}, zmm24, [rbx]
vpsraw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsraw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsrldq test vectors: destination, one source (register or memory) and an
; immediate operand of 10, for xmm7, ymm13 and zmm24 destinations.
; Only unmasked variants are listed for this mnemonic.
vpsrldq xmm7, xmm0, 10
vpsrldq xmm7, [rbx], 10
vpsrldq xmm7, [rbx+r11*8+256], 10
vpsrldq xmm7, [rbx+r11*8-256], 10
vpsrldq ymm13, ymm15, 10
vpsrldq ymm13, [rbx], 10
vpsrldq ymm13, [rbx+r11*8+256], 10
vpsrldq ymm13, [rbx+r11*8-256], 10
vpsrldq zmm24, zmm31, 10
vpsrldq zmm24, [rbx], 10
vpsrldq zmm24, [rbx+r11*8+256], 10
vpsrldq zmm24, [rbx+r11*8-256], 10
; vpsrlvw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; the last operand is a full-width vector register, [rbx], or an indexed
; address using a +256 and a -256 displacement.
vpsrlvw xmm2, xmm7, xmm0
vpsrlvw xmm2, xmm7, [rbx]
vpsrlvw xmm2, xmm7, [rbx+r11*8+256]
vpsrlvw xmm2, xmm7, [rbx+r11*8-256]
vpsrlvw xmm2{k5}, xmm7, xmm0
vpsrlvw xmm2{k5}, xmm7, [rbx]
vpsrlvw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsrlvw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsrlvw xmm2{k5}{z}, xmm7, xmm0
vpsrlvw xmm2{k5}{z}, xmm7, [rbx]
vpsrlvw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsrlvw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsrlvw ymm16, ymm13, ymm15
vpsrlvw ymm16, ymm13, [rbx]
vpsrlvw ymm16, ymm13, [rbx+r11*8+256]
vpsrlvw ymm16, ymm13, [rbx+r11*8-256]
vpsrlvw ymm16{k5}, ymm13, ymm15
vpsrlvw ymm16{k5}, ymm13, [rbx]
vpsrlvw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsrlvw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsrlvw ymm16{k5}{z}, ymm13, ymm15
vpsrlvw ymm16{k5}{z}, ymm13, [rbx]
vpsrlvw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsrlvw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsrlvw zmm24, zmm24, zmm31
vpsrlvw zmm24, zmm24, [rbx]
vpsrlvw zmm24, zmm24, [rbx+r11*8+256]
vpsrlvw zmm24, zmm24, [rbx+r11*8-256]
vpsrlvw zmm24{k5}, zmm24, zmm31
vpsrlvw zmm24{k5}, zmm24, [rbx]
vpsrlvw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsrlvw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsrlvw zmm24{k5}{z}, zmm24, zmm31
vpsrlvw zmm24{k5}{z}, zmm24, [rbx]
vpsrlvw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsrlvw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsrlw, immediate form: destination, source (register or memory), and an
; immediate operand of 10. Only unmasked xmm7/ymm13/zmm24 destinations are
; listed for this form.
vpsrlw xmm7, xmm0, 10
vpsrlw xmm7, [rbx], 10
vpsrlw xmm7, [rbx+r11*8+256], 10
vpsrlw xmm7, [rbx+r11*8-256], 10
vpsrlw ymm13, ymm15, 10
vpsrlw ymm13, [rbx], 10
vpsrlw ymm13, [rbx+r11*8+256], 10
vpsrlw ymm13, [rbx+r11*8-256], 10
vpsrlw zmm24, zmm31, 10
vpsrlw zmm24, [rbx], 10
vpsrlw zmm24, [rbx+r11*8+256], 10
vpsrlw zmm24, [rbx+r11*8-256], 10
; vpsrlw, three-operand form: xmm2, ymm16 and zmm24 destinations, each
; unmasked, with the {k5} mask, and with {k5}{z}.
; Note that the register variant of the last operand is xmm0 at every vector
; length, including the ymm16 and zmm24 destinations.
vpsrlw xmm2, xmm7, xmm0
vpsrlw xmm2, xmm7, [rbx]
vpsrlw xmm2, xmm7, [rbx+r11*8+256]
vpsrlw xmm2, xmm7, [rbx+r11*8-256]
vpsrlw xmm2{k5}, xmm7, xmm0
vpsrlw xmm2{k5}, xmm7, [rbx]
vpsrlw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsrlw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsrlw xmm2{k5}{z}, xmm7, xmm0
vpsrlw xmm2{k5}{z}, xmm7, [rbx]
vpsrlw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsrlw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsrlw ymm16, ymm13, xmm0
vpsrlw ymm16, ymm13, [rbx]
vpsrlw ymm16, ymm13, [rbx+r11*8+256]
vpsrlw ymm16, ymm13, [rbx+r11*8-256]
vpsrlw ymm16{k5}, ymm13, xmm0
vpsrlw ymm16{k5}, ymm13, [rbx]
vpsrlw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsrlw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsrlw ymm16{k5}{z}, ymm13, xmm0
vpsrlw ymm16{k5}{z}, ymm13, [rbx]
vpsrlw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsrlw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsrlw zmm24, zmm24, xmm0
vpsrlw zmm24, zmm24, [rbx]
vpsrlw zmm24, zmm24, [rbx+r11*8+256]
vpsrlw zmm24, zmm24, [rbx+r11*8-256]
vpsrlw zmm24{k5}, zmm24, xmm0
vpsrlw zmm24{k5}, zmm24, [rbx]
vpsrlw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsrlw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsrlw zmm24{k5}{z}, zmm24, xmm0
vpsrlw zmm24{k5}{z}, zmm24, [rbx]
vpsrlw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsrlw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubb test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubb xmm2, xmm7, xmm0
vpsubb xmm2, xmm7, [rbx]
vpsubb xmm2, xmm7, [rbx+r11*8+256]
vpsubb xmm2, xmm7, [rbx+r11*8-256]
vpsubb xmm2{k5}, xmm7, xmm0
vpsubb xmm2{k5}, xmm7, [rbx]
vpsubb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubb xmm2{k5}{z}, xmm7, xmm0
vpsubb xmm2{k5}{z}, xmm7, [rbx]
vpsubb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubb ymm16, ymm13, ymm15
vpsubb ymm16, ymm13, [rbx]
vpsubb ymm16, ymm13, [rbx+r11*8+256]
vpsubb ymm16, ymm13, [rbx+r11*8-256]
vpsubb ymm16{k5}, ymm13, ymm15
vpsubb ymm16{k5}, ymm13, [rbx]
vpsubb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubb ymm16{k5}{z}, ymm13, ymm15
vpsubb ymm16{k5}{z}, ymm13, [rbx]
vpsubb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubb zmm24, zmm24, zmm31
vpsubb zmm24, zmm24, [rbx]
vpsubb zmm24, zmm24, [rbx+r11*8+256]
vpsubb zmm24, zmm24, [rbx+r11*8-256]
vpsubb zmm24{k5}, zmm24, zmm31
vpsubb zmm24{k5}, zmm24, [rbx]
vpsubb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubb zmm24{k5}{z}, zmm24, zmm31
vpsubb zmm24{k5}{z}, zmm24, [rbx]
vpsubb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubsb test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubsb xmm2, xmm7, xmm0
vpsubsb xmm2, xmm7, [rbx]
vpsubsb xmm2, xmm7, [rbx+r11*8+256]
vpsubsb xmm2, xmm7, [rbx+r11*8-256]
vpsubsb xmm2{k5}, xmm7, xmm0
vpsubsb xmm2{k5}, xmm7, [rbx]
vpsubsb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubsb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubsb xmm2{k5}{z}, xmm7, xmm0
vpsubsb xmm2{k5}{z}, xmm7, [rbx]
vpsubsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubsb ymm16, ymm13, ymm15
vpsubsb ymm16, ymm13, [rbx]
vpsubsb ymm16, ymm13, [rbx+r11*8+256]
vpsubsb ymm16, ymm13, [rbx+r11*8-256]
vpsubsb ymm16{k5}, ymm13, ymm15
vpsubsb ymm16{k5}, ymm13, [rbx]
vpsubsb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubsb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubsb ymm16{k5}{z}, ymm13, ymm15
vpsubsb ymm16{k5}{z}, ymm13, [rbx]
vpsubsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubsb zmm24, zmm24, zmm31
vpsubsb zmm24, zmm24, [rbx]
vpsubsb zmm24, zmm24, [rbx+r11*8+256]
vpsubsb zmm24, zmm24, [rbx+r11*8-256]
vpsubsb zmm24{k5}, zmm24, zmm31
vpsubsb zmm24{k5}, zmm24, [rbx]
vpsubsb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubsb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubsb zmm24{k5}{z}, zmm24, zmm31
vpsubsb zmm24{k5}{z}, zmm24, [rbx]
vpsubsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubsw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubsw xmm2, xmm7, xmm0
vpsubsw xmm2, xmm7, [rbx]
vpsubsw xmm2, xmm7, [rbx+r11*8+256]
vpsubsw xmm2, xmm7, [rbx+r11*8-256]
vpsubsw xmm2{k5}, xmm7, xmm0
vpsubsw xmm2{k5}, xmm7, [rbx]
vpsubsw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubsw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubsw xmm2{k5}{z}, xmm7, xmm0
vpsubsw xmm2{k5}{z}, xmm7, [rbx]
vpsubsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubsw ymm16, ymm13, ymm15
vpsubsw ymm16, ymm13, [rbx]
vpsubsw ymm16, ymm13, [rbx+r11*8+256]
vpsubsw ymm16, ymm13, [rbx+r11*8-256]
vpsubsw ymm16{k5}, ymm13, ymm15
vpsubsw ymm16{k5}, ymm13, [rbx]
vpsubsw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubsw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubsw ymm16{k5}{z}, ymm13, ymm15
vpsubsw ymm16{k5}{z}, ymm13, [rbx]
vpsubsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubsw zmm24, zmm24, zmm31
vpsubsw zmm24, zmm24, [rbx]
vpsubsw zmm24, zmm24, [rbx+r11*8+256]
vpsubsw zmm24, zmm24, [rbx+r11*8-256]
vpsubsw zmm24{k5}, zmm24, zmm31
vpsubsw zmm24{k5}, zmm24, [rbx]
vpsubsw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubsw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubsw zmm24{k5}{z}, zmm24, zmm31
vpsubsw zmm24{k5}{z}, zmm24, [rbx]
vpsubsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubusb test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubusb xmm2, xmm7, xmm0
vpsubusb xmm2, xmm7, [rbx]
vpsubusb xmm2, xmm7, [rbx+r11*8+256]
vpsubusb xmm2, xmm7, [rbx+r11*8-256]
vpsubusb xmm2{k5}, xmm7, xmm0
vpsubusb xmm2{k5}, xmm7, [rbx]
vpsubusb xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubusb xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubusb xmm2{k5}{z}, xmm7, xmm0
vpsubusb xmm2{k5}{z}, xmm7, [rbx]
vpsubusb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubusb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubusb ymm16, ymm13, ymm15
vpsubusb ymm16, ymm13, [rbx]
vpsubusb ymm16, ymm13, [rbx+r11*8+256]
vpsubusb ymm16, ymm13, [rbx+r11*8-256]
vpsubusb ymm16{k5}, ymm13, ymm15
vpsubusb ymm16{k5}, ymm13, [rbx]
vpsubusb ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubusb ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubusb ymm16{k5}{z}, ymm13, ymm15
vpsubusb ymm16{k5}{z}, ymm13, [rbx]
vpsubusb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubusb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubusb zmm24, zmm24, zmm31
vpsubusb zmm24, zmm24, [rbx]
vpsubusb zmm24, zmm24, [rbx+r11*8+256]
vpsubusb zmm24, zmm24, [rbx+r11*8-256]
vpsubusb zmm24{k5}, zmm24, zmm31
vpsubusb zmm24{k5}, zmm24, [rbx]
vpsubusb zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubusb zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubusb zmm24{k5}{z}, zmm24, zmm31
vpsubusb zmm24{k5}{z}, zmm24, [rbx]
vpsubusb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubusb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubusw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubusw xmm2, xmm7, xmm0
vpsubusw xmm2, xmm7, [rbx]
vpsubusw xmm2, xmm7, [rbx+r11*8+256]
vpsubusw xmm2, xmm7, [rbx+r11*8-256]
vpsubusw xmm2{k5}, xmm7, xmm0
vpsubusw xmm2{k5}, xmm7, [rbx]
vpsubusw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubusw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubusw xmm2{k5}{z}, xmm7, xmm0
vpsubusw xmm2{k5}{z}, xmm7, [rbx]
vpsubusw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubusw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubusw ymm16, ymm13, ymm15
vpsubusw ymm16, ymm13, [rbx]
vpsubusw ymm16, ymm13, [rbx+r11*8+256]
vpsubusw ymm16, ymm13, [rbx+r11*8-256]
vpsubusw ymm16{k5}, ymm13, ymm15
vpsubusw ymm16{k5}, ymm13, [rbx]
vpsubusw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubusw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubusw ymm16{k5}{z}, ymm13, ymm15
vpsubusw ymm16{k5}{z}, ymm13, [rbx]
vpsubusw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubusw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubusw zmm24, zmm24, zmm31
vpsubusw zmm24, zmm24, [rbx]
vpsubusw zmm24, zmm24, [rbx+r11*8+256]
vpsubusw zmm24, zmm24, [rbx+r11*8-256]
vpsubusw zmm24{k5}, zmm24, zmm31
vpsubusw zmm24{k5}, zmm24, [rbx]
vpsubusw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubusw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubusw zmm24{k5}{z}, zmm24, zmm31
vpsubusw zmm24{k5}{z}, zmm24, [rbx]
vpsubusw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubusw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpsubw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpsubw xmm2, xmm7, xmm0
vpsubw xmm2, xmm7, [rbx]
vpsubw xmm2, xmm7, [rbx+r11*8+256]
vpsubw xmm2, xmm7, [rbx+r11*8-256]
vpsubw xmm2{k5}, xmm7, xmm0
vpsubw xmm2{k5}, xmm7, [rbx]
vpsubw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpsubw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpsubw xmm2{k5}{z}, xmm7, xmm0
vpsubw xmm2{k5}{z}, xmm7, [rbx]
vpsubw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpsubw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpsubw ymm16, ymm13, ymm15
vpsubw ymm16, ymm13, [rbx]
vpsubw ymm16, ymm13, [rbx+r11*8+256]
vpsubw ymm16, ymm13, [rbx+r11*8-256]
vpsubw ymm16{k5}, ymm13, ymm15
vpsubw ymm16{k5}, ymm13, [rbx]
vpsubw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpsubw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpsubw ymm16{k5}{z}, ymm13, ymm15
vpsubw ymm16{k5}{z}, ymm13, [rbx]
vpsubw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpsubw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpsubw zmm24, zmm24, zmm31
vpsubw zmm24, zmm24, [rbx]
vpsubw zmm24, zmm24, [rbx+r11*8+256]
vpsubw zmm24, zmm24, [rbx+r11*8-256]
vpsubw zmm24{k5}, zmm24, zmm31
vpsubw zmm24{k5}, zmm24, [rbx]
vpsubw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpsubw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpsubw zmm24{k5}{z}, zmm24, zmm31
vpsubw zmm24{k5}{z}, zmm24, [rbx]
vpsubw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpsubw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vptestmb test vectors: the destination is mask register k3; the sources are
; xmm, ymm or zmm registers, with the last operand given as a register, [rbx],
; or an indexed address with +256 / -256 displacement.
; Unmasked variants for all three vector lengths come first.
vptestmb k3, xmm7, xmm0
vptestmb k3, xmm7, [rbx]
vptestmb k3, xmm7, [rbx+r11*8+256]
vptestmb k3, xmm7, [rbx+r11*8-256]
vptestmb k3, ymm13, ymm15
vptestmb k3, ymm13, [rbx]
vptestmb k3, ymm13, [rbx+r11*8+256]
vptestmb k3, ymm13, [rbx+r11*8-256]
vptestmb k3, zmm24, zmm31
vptestmb k3, zmm24, [rbx]
vptestmb k3, zmm24, [rbx+r11*8+256]
vptestmb k3, zmm24, [rbx+r11*8-256]
; Same operand combinations with the {k5} mask applied to k3
; (no {z} variants are listed for this mnemonic).
vptestmb k3{k5}, xmm7, xmm0
vptestmb k3{k5}, xmm7, [rbx]
vptestmb k3{k5}, xmm7, [rbx+r11*8+256]
vptestmb k3{k5}, xmm7, [rbx+r11*8-256]
vptestmb k3{k5}, ymm13, ymm15
vptestmb k3{k5}, ymm13, [rbx]
vptestmb k3{k5}, ymm13, [rbx+r11*8+256]
vptestmb k3{k5}, ymm13, [rbx+r11*8-256]
vptestmb k3{k5}, zmm24, zmm31
vptestmb k3{k5}, zmm24, [rbx]
vptestmb k3{k5}, zmm24, [rbx+r11*8+256]
vptestmb k3{k5}, zmm24, [rbx+r11*8-256]
; vptestmw test vectors: the destination is mask register k3; the sources are
; xmm, ymm or zmm registers, with the last operand given as a register, [rbx],
; or an indexed address with +256 / -256 displacement.
; Unmasked variants for all three vector lengths come first.
vptestmw k3, xmm7, xmm0
vptestmw k3, xmm7, [rbx]
vptestmw k3, xmm7, [rbx+r11*8+256]
vptestmw k3, xmm7, [rbx+r11*8-256]
vptestmw k3, ymm13, ymm15
vptestmw k3, ymm13, [rbx]
vptestmw k3, ymm13, [rbx+r11*8+256]
vptestmw k3, ymm13, [rbx+r11*8-256]
vptestmw k3, zmm24, zmm31
vptestmw k3, zmm24, [rbx]
vptestmw k3, zmm24, [rbx+r11*8+256]
vptestmw k3, zmm24, [rbx+r11*8-256]
; Same operand combinations with the {k5} mask applied to k3
; (no {z} variants are listed for this mnemonic).
vptestmw k3{k5}, xmm7, xmm0
vptestmw k3{k5}, xmm7, [rbx]
vptestmw k3{k5}, xmm7, [rbx+r11*8+256]
vptestmw k3{k5}, xmm7, [rbx+r11*8-256]
vptestmw k3{k5}, ymm13, ymm15
vptestmw k3{k5}, ymm13, [rbx]
vptestmw k3{k5}, ymm13, [rbx+r11*8+256]
vptestmw k3{k5}, ymm13, [rbx+r11*8-256]
vptestmw k3{k5}, zmm24, zmm31
vptestmw k3{k5}, zmm24, [rbx]
vptestmw k3{k5}, zmm24, [rbx+r11*8+256]
vptestmw k3{k5}, zmm24, [rbx+r11*8-256]
; vptestnmb test vectors: the destination is mask register k3; the sources are
; xmm, ymm or zmm registers, with the last operand given as a register, [rbx],
; or an indexed address with +256 / -256 displacement.
; Unmasked variants for all three vector lengths come first.
vptestnmb k3, xmm7, xmm0
vptestnmb k3, xmm7, [rbx]
vptestnmb k3, xmm7, [rbx+r11*8+256]
vptestnmb k3, xmm7, [rbx+r11*8-256]
vptestnmb k3, ymm13, ymm15
vptestnmb k3, ymm13, [rbx]
vptestnmb k3, ymm13, [rbx+r11*8+256]
vptestnmb k3, ymm13, [rbx+r11*8-256]
vptestnmb k3, zmm24, zmm31
vptestnmb k3, zmm24, [rbx]
vptestnmb k3, zmm24, [rbx+r11*8+256]
vptestnmb k3, zmm24, [rbx+r11*8-256]
; Same operand combinations with the {k5} mask applied to k3
; (no {z} variants are listed for this mnemonic).
vptestnmb k3{k5}, xmm7, xmm0
vptestnmb k3{k5}, xmm7, [rbx]
vptestnmb k3{k5}, xmm7, [rbx+r11*8+256]
vptestnmb k3{k5}, xmm7, [rbx+r11*8-256]
vptestnmb k3{k5}, ymm13, ymm15
vptestnmb k3{k5}, ymm13, [rbx]
vptestnmb k3{k5}, ymm13, [rbx+r11*8+256]
vptestnmb k3{k5}, ymm13, [rbx+r11*8-256]
vptestnmb k3{k5}, zmm24, zmm31
vptestnmb k3{k5}, zmm24, [rbx]
vptestnmb k3{k5}, zmm24, [rbx+r11*8+256]
vptestnmb k3{k5}, zmm24, [rbx+r11*8-256]
; vptestnmw test vectors: the destination is mask register k3; the sources are
; xmm, ymm or zmm registers, with the last operand given as a register, [rbx],
; or an indexed address with +256 / -256 displacement.
; Unmasked variants for all three vector lengths come first.
vptestnmw k3, xmm7, xmm0
vptestnmw k3, xmm7, [rbx]
vptestnmw k3, xmm7, [rbx+r11*8+256]
vptestnmw k3, xmm7, [rbx+r11*8-256]
vptestnmw k3, ymm13, ymm15
vptestnmw k3, ymm13, [rbx]
vptestnmw k3, ymm13, [rbx+r11*8+256]
vptestnmw k3, ymm13, [rbx+r11*8-256]
vptestnmw k3, zmm24, zmm31
vptestnmw k3, zmm24, [rbx]
vptestnmw k3, zmm24, [rbx+r11*8+256]
vptestnmw k3, zmm24, [rbx+r11*8-256]
; Same operand combinations with the {k5} mask applied to k3
; (no {z} variants are listed for this mnemonic).
vptestnmw k3{k5}, xmm7, xmm0
vptestnmw k3{k5}, xmm7, [rbx]
vptestnmw k3{k5}, xmm7, [rbx+r11*8+256]
vptestnmw k3{k5}, xmm7, [rbx+r11*8-256]
vptestnmw k3{k5}, ymm13, ymm15
vptestnmw k3{k5}, ymm13, [rbx]
vptestnmw k3{k5}, ymm13, [rbx+r11*8+256]
vptestnmw k3{k5}, ymm13, [rbx+r11*8-256]
vptestnmw k3{k5}, zmm24, zmm31
vptestnmw k3{k5}, zmm24, [rbx]
vptestnmw k3{k5}, zmm24, [rbx+r11*8+256]
vptestnmw k3{k5}, zmm24, [rbx+r11*8-256]
; vpunpckhbw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpunpckhbw xmm2, xmm7, xmm0
vpunpckhbw xmm2, xmm7, [rbx]
vpunpckhbw xmm2, xmm7, [rbx+r11*8+256]
vpunpckhbw xmm2, xmm7, [rbx+r11*8-256]
vpunpckhbw xmm2{k5}, xmm7, xmm0
vpunpckhbw xmm2{k5}, xmm7, [rbx]
vpunpckhbw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpunpckhbw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpunpckhbw xmm2{k5}{z}, xmm7, xmm0
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx]
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpunpckhbw ymm16, ymm13, ymm15
vpunpckhbw ymm16, ymm13, [rbx]
vpunpckhbw ymm16, ymm13, [rbx+r11*8+256]
vpunpckhbw ymm16, ymm13, [rbx+r11*8-256]
vpunpckhbw ymm16{k5}, ymm13, ymm15
vpunpckhbw ymm16{k5}, ymm13, [rbx]
vpunpckhbw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpunpckhbw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpunpckhbw ymm16{k5}{z}, ymm13, ymm15
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx]
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpunpckhbw zmm24, zmm24, zmm31
vpunpckhbw zmm24, zmm24, [rbx]
vpunpckhbw zmm24, zmm24, [rbx+r11*8+256]
vpunpckhbw zmm24, zmm24, [rbx+r11*8-256]
vpunpckhbw zmm24{k5}, zmm24, zmm31
vpunpckhbw zmm24{k5}, zmm24, [rbx]
vpunpckhbw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpunpckhbw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpunpckhbw zmm24{k5}{z}, zmm24, zmm31
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx]
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpunpckhwd test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpunpckhwd xmm2, xmm7, xmm0
vpunpckhwd xmm2, xmm7, [rbx]
vpunpckhwd xmm2, xmm7, [rbx+r11*8+256]
vpunpckhwd xmm2, xmm7, [rbx+r11*8-256]
vpunpckhwd xmm2{k5}, xmm7, xmm0
vpunpckhwd xmm2{k5}, xmm7, [rbx]
vpunpckhwd xmm2{k5}, xmm7, [rbx+r11*8+256]
vpunpckhwd xmm2{k5}, xmm7, [rbx+r11*8-256]
vpunpckhwd xmm2{k5}{z}, xmm7, xmm0
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx]
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpunpckhwd ymm16, ymm13, ymm15
vpunpckhwd ymm16, ymm13, [rbx]
vpunpckhwd ymm16, ymm13, [rbx+r11*8+256]
vpunpckhwd ymm16, ymm13, [rbx+r11*8-256]
vpunpckhwd ymm16{k5}, ymm13, ymm15
vpunpckhwd ymm16{k5}, ymm13, [rbx]
vpunpckhwd ymm16{k5}, ymm13, [rbx+r11*8+256]
vpunpckhwd ymm16{k5}, ymm13, [rbx+r11*8-256]
vpunpckhwd ymm16{k5}{z}, ymm13, ymm15
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx]
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpunpckhwd zmm24, zmm24, zmm31
vpunpckhwd zmm24, zmm24, [rbx]
vpunpckhwd zmm24, zmm24, [rbx+r11*8+256]
vpunpckhwd zmm24, zmm24, [rbx+r11*8-256]
vpunpckhwd zmm24{k5}, zmm24, zmm31
vpunpckhwd zmm24{k5}, zmm24, [rbx]
vpunpckhwd zmm24{k5}, zmm24, [rbx+r11*8+256]
vpunpckhwd zmm24{k5}, zmm24, [rbx+r11*8-256]
vpunpckhwd zmm24{k5}{z}, zmm24, zmm31
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx]
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpunpcklbw test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpunpcklbw xmm2, xmm7, xmm0
vpunpcklbw xmm2, xmm7, [rbx]
vpunpcklbw xmm2, xmm7, [rbx+r11*8+256]
vpunpcklbw xmm2, xmm7, [rbx+r11*8-256]
vpunpcklbw xmm2{k5}, xmm7, xmm0
vpunpcklbw xmm2{k5}, xmm7, [rbx]
vpunpcklbw xmm2{k5}, xmm7, [rbx+r11*8+256]
vpunpcklbw xmm2{k5}, xmm7, [rbx+r11*8-256]
vpunpcklbw xmm2{k5}{z}, xmm7, xmm0
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx]
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpunpcklbw ymm16, ymm13, ymm15
vpunpcklbw ymm16, ymm13, [rbx]
vpunpcklbw ymm16, ymm13, [rbx+r11*8+256]
vpunpcklbw ymm16, ymm13, [rbx+r11*8-256]
vpunpcklbw ymm16{k5}, ymm13, ymm15
vpunpcklbw ymm16{k5}, ymm13, [rbx]
vpunpcklbw ymm16{k5}, ymm13, [rbx+r11*8+256]
vpunpcklbw ymm16{k5}, ymm13, [rbx+r11*8-256]
vpunpcklbw ymm16{k5}{z}, ymm13, ymm15
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx]
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpunpcklbw zmm24, zmm24, zmm31
vpunpcklbw zmm24, zmm24, [rbx]
vpunpcklbw zmm24, zmm24, [rbx+r11*8+256]
vpunpcklbw zmm24, zmm24, [rbx+r11*8-256]
vpunpcklbw zmm24{k5}, zmm24, zmm31
vpunpcklbw zmm24{k5}, zmm24, [rbx]
vpunpcklbw zmm24{k5}, zmm24, [rbx+r11*8+256]
vpunpcklbw zmm24{k5}, zmm24, [rbx+r11*8-256]
vpunpcklbw zmm24{k5}{z}, zmm24, zmm31
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx]
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
; vpunpcklwd test vectors: xmm2, ymm16 and zmm24 destinations.
; Each vector length appears unmasked, with the {k5} mask, and with {k5}{z};
; every variant is listed with a register source, [rbx], and an indexed
; address using a +256 and a -256 displacement.
vpunpcklwd xmm2, xmm7, xmm0
vpunpcklwd xmm2, xmm7, [rbx]
vpunpcklwd xmm2, xmm7, [rbx+r11*8+256]
vpunpcklwd xmm2, xmm7, [rbx+r11*8-256]
vpunpcklwd xmm2{k5}, xmm7, xmm0
vpunpcklwd xmm2{k5}, xmm7, [rbx]
vpunpcklwd xmm2{k5}, xmm7, [rbx+r11*8+256]
vpunpcklwd xmm2{k5}, xmm7, [rbx+r11*8-256]
vpunpcklwd xmm2{k5}{z}, xmm7, xmm0
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx]
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
vpunpcklwd ymm16, ymm13, ymm15
vpunpcklwd ymm16, ymm13, [rbx]
vpunpcklwd ymm16, ymm13, [rbx+r11*8+256]
vpunpcklwd ymm16, ymm13, [rbx+r11*8-256]
vpunpcklwd ymm16{k5}, ymm13, ymm15
vpunpcklwd ymm16{k5}, ymm13, [rbx]
vpunpcklwd ymm16{k5}, ymm13, [rbx+r11*8+256]
vpunpcklwd ymm16{k5}, ymm13, [rbx+r11*8-256]
vpunpcklwd ymm16{k5}{z}, ymm13, ymm15
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx]
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
vpunpcklwd zmm24, zmm24, zmm31
vpunpcklwd zmm24, zmm24, [rbx]
vpunpcklwd zmm24, zmm24, [rbx+r11*8+256]
vpunpcklwd zmm24, zmm24, [rbx+r11*8-256]
vpunpcklwd zmm24{k5}, zmm24, zmm31
vpunpcklwd zmm24{k5}, zmm24, [rbx]
vpunpcklwd zmm24{k5}, zmm24, [rbx+r11*8+256]
vpunpcklwd zmm24{k5}, zmm24, [rbx+r11*8-256]
vpunpcklwd zmm24{k5}{z}, zmm24, zmm31
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx]
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]