mirror of
https://github.com/bitdefender/bddisasm.git
synced 2024-11-24 08:28:07 +00:00
76d92e73c2
- Add support for AVX512-FP16 instructions, as per https://software.intel.com/content/www/us/en/develop/download/intel-avx512-fp16-architecture-specification.html - Bug fix: zeroing with no masking is not supported, so return an error if we encounter such encodings - Bug fix: ignore VEX/EVEX.W field outside 64 bit mode for some instructions - Several other minor fixes and improvements
2746 lines
104 KiB
NASM
2746 lines
104 KiB
NASM
bits 64
|
|
|
|
kaddd k3, k7, k1
|
|
kaddq k3, k7, k1
|
|
kandd k3, k7, k1
|
|
kandnd k3, k7, k1
|
|
kandnq k3, k7, k1
|
|
kandq k3, k7, k1
|
|
kmovd k3, [rbx]
|
|
kmovd k3, [rbx+rsi*8+256]
|
|
kmovd k3, [rbx+rsi*8-256]
|
|
kmovd k3, k1
|
|
kmovd k3, [rbx]
|
|
kmovd [rbx], k3
|
|
kmovd [rbx+rsi*8+256], k3
|
|
kmovd [rbx+rsi*8-256], k3
|
|
kmovd k3, ecx
|
|
kmovd ecx, k1
|
|
kmovq k3, [rbx]
|
|
kmovq k3, [rbx+rsi*8+256]
|
|
kmovq k3, [rbx+rsi*8-256]
|
|
kmovq k3, k1
|
|
kmovq k3, [rbx]
|
|
kmovq [rbx], k3
|
|
kmovq [rbx+rsi*8+256], k3
|
|
kmovq [rbx+rsi*8-256], k3
|
|
kmovq k3, rcx
|
|
kmovq rcx, k1
|
|
knotd k3, k1
|
|
knotq k3, k1
|
|
kord k3, k7, k1
|
|
korq k3, k7, k1
|
|
kortestd k3, k1
|
|
kortestq k3, k1
|
|
kshiftld k3, k1, 10
|
|
kshiftlq k3, k1, 10
|
|
kshiftrd k3, k1, 10
|
|
kshiftrq k3, k1, 10
|
|
ktestd k3, k1
|
|
ktestq k3, k1
|
|
kunpckdq k3, k7, k1
|
|
kunpckwd k3, k7, k1
|
|
kxnord k3, k7, k1
|
|
kxnorq k3, k7, k1
|
|
kxord k3, k7, k1
|
|
kxorq k3, k7, k1
|
|
vdbpsadbw xmm2, xmm7, xmm0, 10
|
|
vdbpsadbw xmm2, xmm7, [rbx], 10
|
|
vdbpsadbw xmm2, xmm7, [rbx+r11*8+256], 10
|
|
vdbpsadbw xmm2, xmm7, [rbx+r11*8-256], 10
|
|
vdbpsadbw xmm2{k5}, xmm7, xmm0, 10
|
|
vdbpsadbw xmm2{k5}, xmm7, [rbx], 10
|
|
vdbpsadbw xmm2{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vdbpsadbw xmm2{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vdbpsadbw xmm2{k5}{z}, xmm7, xmm0, 10
|
|
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx], 10
|
|
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10
|
|
vdbpsadbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10
|
|
vdbpsadbw ymm16, ymm13, ymm15, 10
|
|
vdbpsadbw ymm16, ymm13, [rbx], 10
|
|
vdbpsadbw ymm16, ymm13, [rbx+r11*8+256], 10
|
|
vdbpsadbw ymm16, ymm13, [rbx+r11*8-256], 10
|
|
vdbpsadbw ymm16{k5}, ymm13, ymm15, 10
|
|
vdbpsadbw ymm16{k5}, ymm13, [rbx], 10
|
|
vdbpsadbw ymm16{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vdbpsadbw ymm16{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vdbpsadbw ymm16{k5}{z}, ymm13, ymm15, 10
|
|
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx], 10
|
|
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10
|
|
vdbpsadbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10
|
|
vdbpsadbw zmm24, zmm24, zmm31, 10
|
|
vdbpsadbw zmm24, zmm24, [rbx], 10
|
|
vdbpsadbw zmm24, zmm24, [rbx+r11*8+256], 10
|
|
vdbpsadbw zmm24, zmm24, [rbx+r11*8-256], 10
|
|
vdbpsadbw zmm24{k5}, zmm24, zmm31, 10
|
|
vdbpsadbw zmm24{k5}, zmm24, [rbx], 10
|
|
vdbpsadbw zmm24{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vdbpsadbw zmm24{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vdbpsadbw zmm24{k5}{z}, zmm24, zmm31, 10
|
|
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx], 10
|
|
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10
|
|
vdbpsadbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10
|
|
vmovdqu16 xmm2, xmm0
|
|
vmovdqu16 xmm2, [rbx]
|
|
vmovdqu16 xmm2, [rbx+r11*8+256]
|
|
vmovdqu16 xmm2, [rbx+r11*8-256]
|
|
vmovdqu16 xmm2{k5}, xmm0
|
|
vmovdqu16 xmm2{k5}, [rbx]
|
|
vmovdqu16 xmm2{k5}, [rbx+r11*8+256]
|
|
vmovdqu16 xmm2{k5}, [rbx+r11*8-256]
|
|
vmovdqu16 xmm2{k5}{z}, xmm0
|
|
vmovdqu16 xmm2{k5}{z}, [rbx]
|
|
vmovdqu16 xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu16 xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu16 ymm16, ymm15
|
|
vmovdqu16 ymm16, [rbx]
|
|
vmovdqu16 ymm16, [rbx+r11*8+256]
|
|
vmovdqu16 ymm16, [rbx+r11*8-256]
|
|
vmovdqu16 ymm16{k5}, ymm15
|
|
vmovdqu16 ymm16{k5}, [rbx]
|
|
vmovdqu16 ymm16{k5}, [rbx+r11*8+256]
|
|
vmovdqu16 ymm16{k5}, [rbx+r11*8-256]
|
|
vmovdqu16 ymm16{k5}{z}, ymm15
|
|
vmovdqu16 ymm16{k5}{z}, [rbx]
|
|
vmovdqu16 ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu16 ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu16 zmm24, zmm31
|
|
vmovdqu16 zmm24, [rbx]
|
|
vmovdqu16 zmm24, [rbx+r11*8+256]
|
|
vmovdqu16 zmm24, [rbx+r11*8-256]
|
|
vmovdqu16 zmm24{k5}, zmm31
|
|
vmovdqu16 zmm24{k5}, [rbx]
|
|
vmovdqu16 zmm24{k5}, [rbx+r11*8+256]
|
|
vmovdqu16 zmm24{k5}, [rbx+r11*8-256]
|
|
vmovdqu16 zmm24{k5}{z}, zmm31
|
|
vmovdqu16 zmm24{k5}{z}, [rbx]
|
|
vmovdqu16 zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu16 zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu16 xmm0, xmm2
|
|
vmovdqu16 ymm15, ymm16
|
|
vmovdqu16 zmm31, zmm24
|
|
vmovdqu16 [rbx], xmm2
|
|
vmovdqu16 [rbx], ymm16
|
|
vmovdqu16 [rbx], zmm24
|
|
vmovdqu16 [rbx+r11*8+256], xmm2
|
|
vmovdqu16 [rbx+r11*8+256], ymm16
|
|
vmovdqu16 [rbx+r11*8+256], zmm24
|
|
vmovdqu16 [rbx+r11*8-256], xmm2
|
|
vmovdqu16 [rbx+r11*8-256], ymm16
|
|
vmovdqu16 [rbx+r11*8-256], zmm24
|
|
vmovdqu8 xmm2, xmm0
|
|
vmovdqu8 xmm2, [rbx]
|
|
vmovdqu8 xmm2, [rbx+r11*8+256]
|
|
vmovdqu8 xmm2, [rbx+r11*8-256]
|
|
vmovdqu8 xmm2{k5}, xmm0
|
|
vmovdqu8 xmm2{k5}, [rbx]
|
|
vmovdqu8 xmm2{k5}, [rbx+r11*8+256]
|
|
vmovdqu8 xmm2{k5}, [rbx+r11*8-256]
|
|
vmovdqu8 xmm2{k5}{z}, xmm0
|
|
vmovdqu8 xmm2{k5}{z}, [rbx]
|
|
vmovdqu8 xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu8 xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu8 ymm16, ymm15
|
|
vmovdqu8 ymm16, [rbx]
|
|
vmovdqu8 ymm16, [rbx+r11*8+256]
|
|
vmovdqu8 ymm16, [rbx+r11*8-256]
|
|
vmovdqu8 ymm16{k5}, ymm15
|
|
vmovdqu8 ymm16{k5}, [rbx]
|
|
vmovdqu8 ymm16{k5}, [rbx+r11*8+256]
|
|
vmovdqu8 ymm16{k5}, [rbx+r11*8-256]
|
|
vmovdqu8 ymm16{k5}{z}, ymm15
|
|
vmovdqu8 ymm16{k5}{z}, [rbx]
|
|
vmovdqu8 ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu8 ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu8 zmm24, zmm31
|
|
vmovdqu8 zmm24, [rbx]
|
|
vmovdqu8 zmm24, [rbx+r11*8+256]
|
|
vmovdqu8 zmm24, [rbx+r11*8-256]
|
|
vmovdqu8 zmm24{k5}, zmm31
|
|
vmovdqu8 zmm24{k5}, [rbx]
|
|
vmovdqu8 zmm24{k5}, [rbx+r11*8+256]
|
|
vmovdqu8 zmm24{k5}, [rbx+r11*8-256]
|
|
vmovdqu8 zmm24{k5}{z}, zmm31
|
|
vmovdqu8 zmm24{k5}{z}, [rbx]
|
|
vmovdqu8 zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vmovdqu8 zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vmovdqu8 xmm0, xmm2
|
|
vmovdqu8 ymm15, ymm16
|
|
vmovdqu8 zmm31, zmm24
|
|
vmovdqu8 [rbx], xmm2
|
|
vmovdqu8 [rbx], ymm16
|
|
vmovdqu8 [rbx], zmm24
|
|
vmovdqu8 [rbx+r11*8+256], xmm2
|
|
vmovdqu8 [rbx+r11*8+256], ymm16
|
|
vmovdqu8 [rbx+r11*8+256], zmm24
|
|
vmovdqu8 [rbx+r11*8-256], xmm2
|
|
vmovdqu8 [rbx+r11*8-256], ymm16
|
|
vmovdqu8 [rbx+r11*8-256], zmm24
|
|
vpabsb xmm2, xmm0
|
|
vpabsb xmm2, [rbx]
|
|
vpabsb xmm2, [rbx+r11*8+256]
|
|
vpabsb xmm2, [rbx+r11*8-256]
|
|
vpabsb xmm2{k5}, xmm0
|
|
vpabsb xmm2{k5}, [rbx]
|
|
vpabsb xmm2{k5}, [rbx+r11*8+256]
|
|
vpabsb xmm2{k5}, [rbx+r11*8-256]
|
|
vpabsb xmm2{k5}{z}, xmm0
|
|
vpabsb xmm2{k5}{z}, [rbx]
|
|
vpabsb xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpabsb xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpabsb ymm16, ymm15
|
|
vpabsb ymm16, [rbx]
|
|
vpabsb ymm16, [rbx+r11*8+256]
|
|
vpabsb ymm16, [rbx+r11*8-256]
|
|
vpabsb ymm16{k5}, ymm15
|
|
vpabsb ymm16{k5}, [rbx]
|
|
vpabsb ymm16{k5}, [rbx+r11*8+256]
|
|
vpabsb ymm16{k5}, [rbx+r11*8-256]
|
|
vpabsb ymm16{k5}{z}, ymm15
|
|
vpabsb ymm16{k5}{z}, [rbx]
|
|
vpabsb ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpabsb ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpabsb zmm24, zmm31
|
|
vpabsb zmm24, [rbx]
|
|
vpabsb zmm24, [rbx+r11*8+256]
|
|
vpabsb zmm24, [rbx+r11*8-256]
|
|
vpabsb zmm24{k5}, zmm31
|
|
vpabsb zmm24{k5}, [rbx]
|
|
vpabsb zmm24{k5}, [rbx+r11*8+256]
|
|
vpabsb zmm24{k5}, [rbx+r11*8-256]
|
|
vpabsb zmm24{k5}{z}, zmm31
|
|
vpabsb zmm24{k5}{z}, [rbx]
|
|
vpabsb zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpabsb zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpabsw xmm2, xmm0
|
|
vpabsw xmm2, [rbx]
|
|
vpabsw xmm2, [rbx+r11*8+256]
|
|
vpabsw xmm2, [rbx+r11*8-256]
|
|
vpabsw xmm2{k5}, xmm0
|
|
vpabsw xmm2{k5}, [rbx]
|
|
vpabsw xmm2{k5}, [rbx+r11*8+256]
|
|
vpabsw xmm2{k5}, [rbx+r11*8-256]
|
|
vpabsw xmm2{k5}{z}, xmm0
|
|
vpabsw xmm2{k5}{z}, [rbx]
|
|
vpabsw xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpabsw xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpabsw ymm16, ymm15
|
|
vpabsw ymm16, [rbx]
|
|
vpabsw ymm16, [rbx+r11*8+256]
|
|
vpabsw ymm16, [rbx+r11*8-256]
|
|
vpabsw ymm16{k5}, ymm15
|
|
vpabsw ymm16{k5}, [rbx]
|
|
vpabsw ymm16{k5}, [rbx+r11*8+256]
|
|
vpabsw ymm16{k5}, [rbx+r11*8-256]
|
|
vpabsw ymm16{k5}{z}, ymm15
|
|
vpabsw ymm16{k5}{z}, [rbx]
|
|
vpabsw ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpabsw ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpabsw zmm24, zmm31
|
|
vpabsw zmm24, [rbx]
|
|
vpabsw zmm24, [rbx+r11*8+256]
|
|
vpabsw zmm24, [rbx+r11*8-256]
|
|
vpabsw zmm24{k5}, zmm31
|
|
vpabsw zmm24{k5}, [rbx]
|
|
vpabsw zmm24{k5}, [rbx+r11*8+256]
|
|
vpabsw zmm24{k5}, [rbx+r11*8-256]
|
|
vpabsw zmm24{k5}{z}, zmm31
|
|
vpabsw zmm24{k5}{z}, [rbx]
|
|
vpabsw zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpabsw zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpackssdw xmm2, xmm7, xmm0
|
|
vpackssdw xmm2, xmm7, [rbx]
|
|
vpackssdw xmm2, xmm7, [rbx]{1to4}
|
|
vpackssdw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpackssdw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpackssdw xmm2{k5}, xmm7, xmm0
|
|
vpackssdw xmm2{k5}, xmm7, [rbx]
|
|
vpackssdw xmm2{k5}, xmm7, [rbx]{1to4}
|
|
vpackssdw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpackssdw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpackssdw xmm2{k5}{z}, xmm7, xmm0
|
|
vpackssdw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpackssdw xmm2{k5}{z}, xmm7, [rbx]{1to4}
|
|
vpackssdw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpackssdw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpackssdw ymm16, ymm13, ymm15
|
|
vpackssdw ymm16, ymm13, [rbx]
|
|
vpackssdw ymm16, ymm13, [rbx]{1to8}
|
|
vpackssdw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpackssdw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpackssdw ymm16{k5}, ymm13, ymm15
|
|
vpackssdw ymm16{k5}, ymm13, [rbx]
|
|
vpackssdw ymm16{k5}, ymm13, [rbx]{1to8}
|
|
vpackssdw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpackssdw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpackssdw ymm16{k5}{z}, ymm13, ymm15
|
|
vpackssdw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpackssdw ymm16{k5}{z}, ymm13, [rbx]{1to8}
|
|
vpackssdw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpackssdw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpackssdw zmm24, zmm24, zmm31
|
|
vpackssdw zmm24, zmm24, [rbx]
|
|
vpackssdw zmm24, zmm24, [rbx]{1to16}
|
|
vpackssdw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpackssdw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpackssdw zmm24{k5}, zmm24, zmm31
|
|
vpackssdw zmm24{k5}, zmm24, [rbx]
|
|
vpackssdw zmm24{k5}, zmm24, [rbx]{1to16}
|
|
vpackssdw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpackssdw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpackssdw zmm24{k5}{z}, zmm24, zmm31
|
|
vpackssdw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpackssdw zmm24{k5}{z}, zmm24, [rbx]{1to16}
|
|
vpackssdw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpackssdw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpacksswb xmm2, xmm7, xmm0
|
|
vpacksswb xmm2, xmm7, [rbx]
|
|
vpacksswb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpacksswb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpacksswb xmm2{k5}, xmm7, xmm0
|
|
vpacksswb xmm2{k5}, xmm7, [rbx]
|
|
vpacksswb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpacksswb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpacksswb xmm2{k5}{z}, xmm7, xmm0
|
|
vpacksswb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpacksswb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpacksswb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpacksswb ymm16, ymm13, ymm15
|
|
vpacksswb ymm16, ymm13, [rbx]
|
|
vpacksswb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpacksswb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpacksswb ymm16{k5}, ymm13, ymm15
|
|
vpacksswb ymm16{k5}, ymm13, [rbx]
|
|
vpacksswb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpacksswb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpacksswb ymm16{k5}{z}, ymm13, ymm15
|
|
vpacksswb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpacksswb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpacksswb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpacksswb zmm24, zmm24, zmm31
|
|
vpacksswb zmm24, zmm24, [rbx]
|
|
vpacksswb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpacksswb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpacksswb zmm24{k5}, zmm24, zmm31
|
|
vpacksswb zmm24{k5}, zmm24, [rbx]
|
|
vpacksswb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpacksswb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpacksswb zmm24{k5}{z}, zmm24, zmm31
|
|
vpacksswb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpacksswb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpacksswb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpackusdw xmm2, xmm7, xmm0
|
|
vpackusdw xmm2, xmm7, [rbx]
|
|
vpackusdw xmm2, xmm7, [rbx]{1to4}
|
|
vpackusdw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpackusdw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpackusdw xmm2{k5}, xmm7, xmm0
|
|
vpackusdw xmm2{k5}, xmm7, [rbx]
|
|
vpackusdw xmm2{k5}, xmm7, [rbx]{1to4}
|
|
vpackusdw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpackusdw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpackusdw xmm2{k5}{z}, xmm7, xmm0
|
|
vpackusdw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpackusdw xmm2{k5}{z}, xmm7, [rbx]{1to4}
|
|
vpackusdw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpackusdw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpackusdw ymm16, ymm13, ymm15
|
|
vpackusdw ymm16, ymm13, [rbx]
|
|
vpackusdw ymm16, ymm13, [rbx]{1to8}
|
|
vpackusdw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpackusdw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpackusdw ymm16{k5}, ymm13, ymm15
|
|
vpackusdw ymm16{k5}, ymm13, [rbx]
|
|
vpackusdw ymm16{k5}, ymm13, [rbx]{1to8}
|
|
vpackusdw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpackusdw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpackusdw ymm16{k5}{z}, ymm13, ymm15
|
|
vpackusdw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpackusdw ymm16{k5}{z}, ymm13, [rbx]{1to8}
|
|
vpackusdw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpackusdw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpackusdw zmm24, zmm24, zmm31
|
|
vpackusdw zmm24, zmm24, [rbx]
|
|
vpackusdw zmm24, zmm24, [rbx]{1to16}
|
|
vpackusdw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpackusdw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpackusdw zmm24{k5}, zmm24, zmm31
|
|
vpackusdw zmm24{k5}, zmm24, [rbx]
|
|
vpackusdw zmm24{k5}, zmm24, [rbx]{1to16}
|
|
vpackusdw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpackusdw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpackusdw zmm24{k5}{z}, zmm24, zmm31
|
|
vpackusdw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpackusdw zmm24{k5}{z}, zmm24, [rbx]{1to16}
|
|
vpackusdw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpackusdw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpackuswb xmm2, xmm7, xmm0
|
|
vpackuswb xmm2, xmm7, [rbx]
|
|
vpackuswb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpackuswb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpackuswb xmm2{k5}, xmm7, xmm0
|
|
vpackuswb xmm2{k5}, xmm7, [rbx]
|
|
vpackuswb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpackuswb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpackuswb xmm2{k5}{z}, xmm7, xmm0
|
|
vpackuswb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpackuswb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpackuswb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpackuswb ymm16, ymm13, ymm15
|
|
vpackuswb ymm16, ymm13, [rbx]
|
|
vpackuswb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpackuswb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpackuswb ymm16{k5}, ymm13, ymm15
|
|
vpackuswb ymm16{k5}, ymm13, [rbx]
|
|
vpackuswb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpackuswb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpackuswb ymm16{k5}{z}, ymm13, ymm15
|
|
vpackuswb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpackuswb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpackuswb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpackuswb zmm24, zmm24, zmm31
|
|
vpackuswb zmm24, zmm24, [rbx]
|
|
vpackuswb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpackuswb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpackuswb zmm24{k5}, zmm24, zmm31
|
|
vpackuswb zmm24{k5}, zmm24, [rbx]
|
|
vpackuswb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpackuswb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpackuswb zmm24{k5}{z}, zmm24, zmm31
|
|
vpackuswb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpackuswb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpackuswb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddb xmm2, xmm7, xmm0
|
|
vpaddb xmm2, xmm7, [rbx]
|
|
vpaddb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddb xmm2{k5}, xmm7, xmm0
|
|
vpaddb xmm2{k5}, xmm7, [rbx]
|
|
vpaddb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddb xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddb ymm16, ymm13, ymm15
|
|
vpaddb ymm16, ymm13, [rbx]
|
|
vpaddb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddb ymm16{k5}, ymm13, ymm15
|
|
vpaddb ymm16{k5}, ymm13, [rbx]
|
|
vpaddb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddb ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddb zmm24, zmm24, zmm31
|
|
vpaddb zmm24, zmm24, [rbx]
|
|
vpaddb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddb zmm24{k5}, zmm24, zmm31
|
|
vpaddb zmm24{k5}, zmm24, [rbx]
|
|
vpaddb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddb zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddsb xmm2, xmm7, xmm0
|
|
vpaddsb xmm2, xmm7, [rbx]
|
|
vpaddsb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddsb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddsb xmm2{k5}, xmm7, xmm0
|
|
vpaddsb xmm2{k5}, xmm7, [rbx]
|
|
vpaddsb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddsb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddsb xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddsb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddsb ymm16, ymm13, ymm15
|
|
vpaddsb ymm16, ymm13, [rbx]
|
|
vpaddsb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddsb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddsb ymm16{k5}, ymm13, ymm15
|
|
vpaddsb ymm16{k5}, ymm13, [rbx]
|
|
vpaddsb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddsb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddsb ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddsb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddsb zmm24, zmm24, zmm31
|
|
vpaddsb zmm24, zmm24, [rbx]
|
|
vpaddsb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddsb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddsb zmm24{k5}, zmm24, zmm31
|
|
vpaddsb zmm24{k5}, zmm24, [rbx]
|
|
vpaddsb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddsb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddsb zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddsb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddsw xmm2, xmm7, xmm0
|
|
vpaddsw xmm2, xmm7, [rbx]
|
|
vpaddsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddsw xmm2{k5}, xmm7, xmm0
|
|
vpaddsw xmm2{k5}, xmm7, [rbx]
|
|
vpaddsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddsw ymm16, ymm13, ymm15
|
|
vpaddsw ymm16, ymm13, [rbx]
|
|
vpaddsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddsw ymm16{k5}, ymm13, ymm15
|
|
vpaddsw ymm16{k5}, ymm13, [rbx]
|
|
vpaddsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddsw zmm24, zmm24, zmm31
|
|
vpaddsw zmm24, zmm24, [rbx]
|
|
vpaddsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddsw zmm24{k5}, zmm24, zmm31
|
|
vpaddsw zmm24{k5}, zmm24, [rbx]
|
|
vpaddsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddusb xmm2, xmm7, xmm0
|
|
vpaddusb xmm2, xmm7, [rbx]
|
|
vpaddusb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddusb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddusb xmm2{k5}, xmm7, xmm0
|
|
vpaddusb xmm2{k5}, xmm7, [rbx]
|
|
vpaddusb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddusb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddusb xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddusb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddusb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddusb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddusb ymm16, ymm13, ymm15
|
|
vpaddusb ymm16, ymm13, [rbx]
|
|
vpaddusb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddusb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddusb ymm16{k5}, ymm13, ymm15
|
|
vpaddusb ymm16{k5}, ymm13, [rbx]
|
|
vpaddusb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddusb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddusb ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddusb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddusb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddusb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddusb zmm24, zmm24, zmm31
|
|
vpaddusb zmm24, zmm24, [rbx]
|
|
vpaddusb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddusb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddusb zmm24{k5}, zmm24, zmm31
|
|
vpaddusb zmm24{k5}, zmm24, [rbx]
|
|
vpaddusb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddusb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddusb zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddusb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddusb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddusb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddusw xmm2, xmm7, xmm0
|
|
vpaddusw xmm2, xmm7, [rbx]
|
|
vpaddusw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddusw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddusw xmm2{k5}, xmm7, xmm0
|
|
vpaddusw xmm2{k5}, xmm7, [rbx]
|
|
vpaddusw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddusw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddusw xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddusw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddusw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddusw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddusw ymm16, ymm13, ymm15
|
|
vpaddusw ymm16, ymm13, [rbx]
|
|
vpaddusw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddusw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddusw ymm16{k5}, ymm13, ymm15
|
|
vpaddusw ymm16{k5}, ymm13, [rbx]
|
|
vpaddusw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddusw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddusw ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddusw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddusw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddusw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddusw zmm24, zmm24, zmm31
|
|
vpaddusw zmm24, zmm24, [rbx]
|
|
vpaddusw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddusw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddusw zmm24{k5}, zmm24, zmm31
|
|
vpaddusw zmm24{k5}, zmm24, [rbx]
|
|
vpaddusw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddusw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddusw zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddusw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddusw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddusw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpaddw xmm2, xmm7, xmm0
|
|
vpaddw xmm2, xmm7, [rbx]
|
|
vpaddw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpaddw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpaddw xmm2{k5}, xmm7, xmm0
|
|
vpaddw xmm2{k5}, xmm7, [rbx]
|
|
vpaddw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpaddw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpaddw xmm2{k5}{z}, xmm7, xmm0
|
|
vpaddw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpaddw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpaddw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpaddw ymm16, ymm13, ymm15
|
|
vpaddw ymm16, ymm13, [rbx]
|
|
vpaddw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpaddw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpaddw ymm16{k5}, ymm13, ymm15
|
|
vpaddw ymm16{k5}, ymm13, [rbx]
|
|
vpaddw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpaddw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpaddw ymm16{k5}{z}, ymm13, ymm15
|
|
vpaddw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpaddw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpaddw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpaddw zmm24, zmm24, zmm31
|
|
vpaddw zmm24, zmm24, [rbx]
|
|
vpaddw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpaddw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpaddw zmm24{k5}, zmm24, zmm31
|
|
vpaddw zmm24{k5}, zmm24, [rbx]
|
|
vpaddw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpaddw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpaddw zmm24{k5}{z}, zmm24, zmm31
|
|
vpaddw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpaddw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpaddw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpalignr xmm2, xmm7, xmm0, 10
|
|
vpalignr xmm2, xmm7, [rbx], 10
|
|
vpalignr xmm2, xmm7, [rbx+r11*8+256], 10
|
|
vpalignr xmm2, xmm7, [rbx+r11*8-256], 10
|
|
vpalignr xmm2{k5}, xmm7, xmm0, 10
|
|
vpalignr xmm2{k5}, xmm7, [rbx], 10
|
|
vpalignr xmm2{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vpalignr xmm2{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vpalignr xmm2{k5}{z}, xmm7, xmm0, 10
|
|
vpalignr xmm2{k5}{z}, xmm7, [rbx], 10
|
|
vpalignr xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10
|
|
vpalignr xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10
|
|
vpalignr ymm16, ymm13, ymm15, 10
|
|
vpalignr ymm16, ymm13, [rbx], 10
|
|
vpalignr ymm16, ymm13, [rbx+r11*8+256], 10
|
|
vpalignr ymm16, ymm13, [rbx+r11*8-256], 10
|
|
vpalignr ymm16{k5}, ymm13, ymm15, 10
|
|
vpalignr ymm16{k5}, ymm13, [rbx], 10
|
|
vpalignr ymm16{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vpalignr ymm16{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vpalignr ymm16{k5}{z}, ymm13, ymm15, 10
|
|
vpalignr ymm16{k5}{z}, ymm13, [rbx], 10
|
|
vpalignr ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10
|
|
vpalignr ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10
|
|
vpalignr zmm24, zmm24, zmm31, 10
|
|
vpalignr zmm24, zmm24, [rbx], 10
|
|
vpalignr zmm24, zmm24, [rbx+r11*8+256], 10
|
|
vpalignr zmm24, zmm24, [rbx+r11*8-256], 10
|
|
vpalignr zmm24{k5}, zmm24, zmm31, 10
|
|
vpalignr zmm24{k5}, zmm24, [rbx], 10
|
|
vpalignr zmm24{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vpalignr zmm24{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vpalignr zmm24{k5}{z}, zmm24, zmm31, 10
|
|
vpalignr zmm24{k5}{z}, zmm24, [rbx], 10
|
|
vpalignr zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10
|
|
vpalignr zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10
|
|
vpavgb xmm2, xmm7, xmm0
|
|
vpavgb xmm2, xmm7, [rbx]
|
|
vpavgb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpavgb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpavgb xmm2{k5}, xmm7, xmm0
|
|
vpavgb xmm2{k5}, xmm7, [rbx]
|
|
vpavgb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpavgb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpavgb xmm2{k5}{z}, xmm7, xmm0
|
|
vpavgb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpavgb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpavgb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpavgb ymm16, ymm13, ymm15
|
|
vpavgb ymm16, ymm13, [rbx]
|
|
vpavgb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpavgb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpavgb ymm16{k5}, ymm13, ymm15
|
|
vpavgb ymm16{k5}, ymm13, [rbx]
|
|
vpavgb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpavgb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpavgb ymm16{k5}{z}, ymm13, ymm15
|
|
vpavgb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpavgb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpavgb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpavgb zmm24, zmm24, zmm31
|
|
vpavgb zmm24, zmm24, [rbx]
|
|
vpavgb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpavgb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpavgb zmm24{k5}, zmm24, zmm31
|
|
vpavgb zmm24{k5}, zmm24, [rbx]
|
|
vpavgb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpavgb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpavgb zmm24{k5}{z}, zmm24, zmm31
|
|
vpavgb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpavgb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpavgb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpavgw xmm2, xmm7, xmm0
|
|
vpavgw xmm2, xmm7, [rbx]
|
|
vpavgw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpavgw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpavgw xmm2{k5}, xmm7, xmm0
|
|
vpavgw xmm2{k5}, xmm7, [rbx]
|
|
vpavgw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpavgw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpavgw xmm2{k5}{z}, xmm7, xmm0
|
|
vpavgw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpavgw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpavgw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpavgw ymm16, ymm13, ymm15
|
|
vpavgw ymm16, ymm13, [rbx]
|
|
vpavgw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpavgw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpavgw ymm16{k5}, ymm13, ymm15
|
|
vpavgw ymm16{k5}, ymm13, [rbx]
|
|
vpavgw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpavgw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpavgw ymm16{k5}{z}, ymm13, ymm15
|
|
vpavgw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpavgw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpavgw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpavgw zmm24, zmm24, zmm31
|
|
vpavgw zmm24, zmm24, [rbx]
|
|
vpavgw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpavgw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpavgw zmm24{k5}, zmm24, zmm31
|
|
vpavgw zmm24{k5}, zmm24, [rbx]
|
|
vpavgw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpavgw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpavgw zmm24{k5}{z}, zmm24, zmm31
|
|
vpavgw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpavgw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpavgw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpblendmb xmm2, xmm7, xmm0
|
|
vpblendmb xmm2, xmm7, [rbx]
|
|
vpblendmb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpblendmb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpblendmb xmm2{k5}, xmm7, xmm0
|
|
vpblendmb xmm2{k5}, xmm7, [rbx]
|
|
vpblendmb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpblendmb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpblendmb xmm2{k5}{z}, xmm7, xmm0
|
|
vpblendmb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpblendmb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpblendmb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpblendmb ymm16, ymm13, ymm15
|
|
vpblendmb ymm16, ymm13, [rbx]
|
|
vpblendmb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpblendmb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpblendmb ymm16{k5}, ymm13, ymm15
|
|
vpblendmb ymm16{k5}, ymm13, [rbx]
|
|
vpblendmb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpblendmb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpblendmb ymm16{k5}{z}, ymm13, ymm15
|
|
vpblendmb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpblendmb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpblendmb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpblendmb zmm24, zmm24, zmm31
|
|
vpblendmb zmm24, zmm24, [rbx]
|
|
vpblendmb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpblendmb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpblendmb zmm24{k5}, zmm24, zmm31
|
|
vpblendmb zmm24{k5}, zmm24, [rbx]
|
|
vpblendmb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpblendmb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpblendmb zmm24{k5}{z}, zmm24, zmm31
|
|
vpblendmb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpblendmb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpblendmb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpblendmw xmm2, xmm7, xmm0
|
|
vpblendmw xmm2, xmm7, [rbx]
|
|
vpblendmw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpblendmw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpblendmw xmm2{k5}, xmm7, xmm0
|
|
vpblendmw xmm2{k5}, xmm7, [rbx]
|
|
vpblendmw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpblendmw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpblendmw xmm2{k5}{z}, xmm7, xmm0
|
|
vpblendmw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpblendmw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpblendmw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpblendmw ymm16, ymm13, ymm15
|
|
vpblendmw ymm16, ymm13, [rbx]
|
|
vpblendmw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpblendmw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpblendmw ymm16{k5}, ymm13, ymm15
|
|
vpblendmw ymm16{k5}, ymm13, [rbx]
|
|
vpblendmw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpblendmw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpblendmw ymm16{k5}{z}, ymm13, ymm15
|
|
vpblendmw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpblendmw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpblendmw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpblendmw zmm24, zmm24, zmm31
|
|
vpblendmw zmm24, zmm24, [rbx]
|
|
vpblendmw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpblendmw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpblendmw zmm24{k5}, zmm24, zmm31
|
|
vpblendmw zmm24{k5}, zmm24, [rbx]
|
|
vpblendmw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpblendmw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpblendmw zmm24{k5}{z}, zmm24, zmm31
|
|
vpblendmw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpblendmw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpblendmw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpbroadcastb xmm2, xmm0
|
|
vpbroadcastb xmm2, [rbx]
|
|
vpbroadcastb xmm2, [rbx+r11*8+256]
|
|
vpbroadcastb xmm2, [rbx+r11*8-256]
|
|
vpbroadcastb xmm2{k5}, xmm0
|
|
vpbroadcastb xmm2{k5}, [rbx]
|
|
vpbroadcastb xmm2{k5}, [rbx+r11*8+256]
|
|
vpbroadcastb xmm2{k5}, [rbx+r11*8-256]
|
|
vpbroadcastb xmm2{k5}{z}, xmm0
|
|
vpbroadcastb xmm2{k5}{z}, [rbx]
|
|
vpbroadcastb xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastb xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastb ymm16, xmm0
|
|
vpbroadcastb ymm16, [rbx]
|
|
vpbroadcastb ymm16, [rbx+r11*8+256]
|
|
vpbroadcastb ymm16, [rbx+r11*8-256]
|
|
vpbroadcastb ymm16{k5}, xmm0
|
|
vpbroadcastb ymm16{k5}, [rbx]
|
|
vpbroadcastb ymm16{k5}, [rbx+r11*8+256]
|
|
vpbroadcastb ymm16{k5}, [rbx+r11*8-256]
|
|
vpbroadcastb ymm16{k5}{z}, xmm0
|
|
vpbroadcastb ymm16{k5}{z}, [rbx]
|
|
vpbroadcastb ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastb ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastb zmm24, xmm0
|
|
vpbroadcastb zmm24, [rbx]
|
|
vpbroadcastb zmm24, [rbx+r11*8+256]
|
|
vpbroadcastb zmm24, [rbx+r11*8-256]
|
|
vpbroadcastb zmm24{k5}, xmm0
|
|
vpbroadcastb zmm24{k5}, [rbx]
|
|
vpbroadcastb zmm24{k5}, [rbx+r11*8+256]
|
|
vpbroadcastb zmm24{k5}, [rbx+r11*8-256]
|
|
vpbroadcastb zmm24{k5}{z}, xmm0
|
|
vpbroadcastb zmm24{k5}{z}, [rbx]
|
|
vpbroadcastb zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastb zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastb xmm2, cl
|
|
vpbroadcastb xmm2, cx
|
|
vpbroadcastb xmm2, ecx
|
|
vpbroadcastb xmm2, rcx
|
|
vpbroadcastb xmm2{k5}, cl
|
|
vpbroadcastb xmm2{k5}, cx
|
|
vpbroadcastb xmm2{k5}, ecx
|
|
vpbroadcastb xmm2{k5}, rcx
|
|
vpbroadcastb xmm2{k5}{z}, cl
|
|
vpbroadcastb xmm2{k5}{z}, cx
|
|
vpbroadcastb xmm2{k5}{z}, ecx
|
|
vpbroadcastb xmm2{k5}{z}, rcx
|
|
vpbroadcastb ymm16, cl
|
|
vpbroadcastb ymm16, cx
|
|
vpbroadcastb ymm16, ecx
|
|
vpbroadcastb ymm16, rcx
|
|
vpbroadcastb ymm16{k5}, cl
|
|
vpbroadcastb ymm16{k5}, cx
|
|
vpbroadcastb ymm16{k5}, ecx
|
|
vpbroadcastb ymm16{k5}, rcx
|
|
vpbroadcastb ymm16{k5}{z}, cl
|
|
vpbroadcastb ymm16{k5}{z}, cx
|
|
vpbroadcastb ymm16{k5}{z}, ecx
|
|
vpbroadcastb ymm16{k5}{z}, rcx
|
|
vpbroadcastb zmm24, cl
|
|
vpbroadcastb zmm24, cx
|
|
vpbroadcastb zmm24, ecx
|
|
vpbroadcastb zmm24, rcx
|
|
vpbroadcastb zmm24{k5}, cl
|
|
vpbroadcastb zmm24{k5}, cx
|
|
vpbroadcastb zmm24{k5}, ecx
|
|
vpbroadcastb zmm24{k5}, rcx
|
|
vpbroadcastb zmm24{k5}{z}, cl
|
|
vpbroadcastb zmm24{k5}{z}, cx
|
|
vpbroadcastb zmm24{k5}{z}, ecx
|
|
vpbroadcastb zmm24{k5}{z}, rcx
|
|
vpbroadcastw xmm2, xmm0
|
|
vpbroadcastw xmm2, [rbx]
|
|
vpbroadcastw xmm2, [rbx+r11*8+256]
|
|
vpbroadcastw xmm2, [rbx+r11*8-256]
|
|
vpbroadcastw xmm2{k5}, xmm0
|
|
vpbroadcastw xmm2{k5}, [rbx]
|
|
vpbroadcastw xmm2{k5}, [rbx+r11*8+256]
|
|
vpbroadcastw xmm2{k5}, [rbx+r11*8-256]
|
|
vpbroadcastw xmm2{k5}{z}, xmm0
|
|
vpbroadcastw xmm2{k5}{z}, [rbx]
|
|
vpbroadcastw xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastw xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastw ymm16, xmm0
|
|
vpbroadcastw ymm16, [rbx]
|
|
vpbroadcastw ymm16, [rbx+r11*8+256]
|
|
vpbroadcastw ymm16, [rbx+r11*8-256]
|
|
vpbroadcastw ymm16{k5}, xmm0
|
|
vpbroadcastw ymm16{k5}, [rbx]
|
|
vpbroadcastw ymm16{k5}, [rbx+r11*8+256]
|
|
vpbroadcastw ymm16{k5}, [rbx+r11*8-256]
|
|
vpbroadcastw ymm16{k5}{z}, xmm0
|
|
vpbroadcastw ymm16{k5}{z}, [rbx]
|
|
vpbroadcastw ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastw ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastw zmm24, xmm0
|
|
vpbroadcastw zmm24, [rbx]
|
|
vpbroadcastw zmm24, [rbx+r11*8+256]
|
|
vpbroadcastw zmm24, [rbx+r11*8-256]
|
|
vpbroadcastw zmm24{k5}, xmm0
|
|
vpbroadcastw zmm24{k5}, [rbx]
|
|
vpbroadcastw zmm24{k5}, [rbx+r11*8+256]
|
|
vpbroadcastw zmm24{k5}, [rbx+r11*8-256]
|
|
vpbroadcastw zmm24{k5}{z}, xmm0
|
|
vpbroadcastw zmm24{k5}{z}, [rbx]
|
|
vpbroadcastw zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpbroadcastw zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpbroadcastw xmm2, cx
|
|
vpbroadcastw xmm2, ecx
|
|
vpbroadcastw xmm2, rcx
|
|
vpbroadcastw xmm2{k5}, cx
|
|
vpbroadcastw xmm2{k5}, ecx
|
|
vpbroadcastw xmm2{k5}, rcx
|
|
vpbroadcastw xmm2{k5}{z}, cx
|
|
vpbroadcastw xmm2{k5}{z}, ecx
|
|
vpbroadcastw xmm2{k5}{z}, rcx
|
|
vpbroadcastw ymm16, cx
|
|
vpbroadcastw ymm16, ecx
|
|
vpbroadcastw ymm16, rcx
|
|
vpbroadcastw ymm16{k5}, cx
|
|
vpbroadcastw ymm16{k5}, ecx
|
|
vpbroadcastw ymm16{k5}, rcx
|
|
vpbroadcastw ymm16{k5}{z}, cx
|
|
vpbroadcastw ymm16{k5}{z}, ecx
|
|
vpbroadcastw ymm16{k5}{z}, rcx
|
|
vpbroadcastw zmm24, cx
|
|
vpbroadcastw zmm24, ecx
|
|
vpbroadcastw zmm24, rcx
|
|
vpbroadcastw zmm24{k5}, cx
|
|
vpbroadcastw zmm24{k5}, ecx
|
|
vpbroadcastw zmm24{k5}, rcx
|
|
vpbroadcastw zmm24{k5}{z}, cx
|
|
vpbroadcastw zmm24{k5}{z}, ecx
|
|
vpbroadcastw zmm24{k5}{z}, rcx
|
|
vpcmpb k3, xmm7, xmm0, 10
|
|
vpcmpb k3, xmm7, [rbx], 10
|
|
vpcmpb k3, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpb k3, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpb k3, ymm13, ymm15, 10
|
|
vpcmpb k3, ymm13, [rbx], 10
|
|
vpcmpb k3, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpb k3, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpb k3, zmm24, zmm31, 10
|
|
vpcmpb k3, zmm24, [rbx], 10
|
|
vpcmpb k3, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpb k3, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpb k3{k5}, xmm7, xmm0, 10
|
|
vpcmpb k3{k5}, xmm7, [rbx], 10
|
|
vpcmpb k3{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpb k3{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpb k3{k5}, ymm13, ymm15, 10
|
|
vpcmpb k3{k5}, ymm13, [rbx], 10
|
|
vpcmpb k3{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpb k3{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpb k3{k5}, zmm24, zmm31, 10
|
|
vpcmpb k3{k5}, zmm24, [rbx], 10
|
|
vpcmpb k3{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpb k3{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpeqb k3, xmm7, xmm0
|
|
vpcmpeqb k3, xmm7, [rbx]
|
|
vpcmpeqb k3, xmm7, [rbx+r11*8+256]
|
|
vpcmpeqb k3, xmm7, [rbx+r11*8-256]
|
|
vpcmpeqb k3, ymm13, ymm15
|
|
vpcmpeqb k3, ymm13, [rbx]
|
|
vpcmpeqb k3, ymm13, [rbx+r11*8+256]
|
|
vpcmpeqb k3, ymm13, [rbx+r11*8-256]
|
|
vpcmpeqb k3, zmm24, zmm31
|
|
vpcmpeqb k3, zmm24, [rbx]
|
|
vpcmpeqb k3, zmm24, [rbx+r11*8+256]
|
|
vpcmpeqb k3, zmm24, [rbx+r11*8-256]
|
|
vpcmpeqb k3{k5}, xmm7, xmm0
|
|
vpcmpeqb k3{k5}, xmm7, [rbx]
|
|
vpcmpeqb k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vpcmpeqb k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vpcmpeqb k3{k5}, ymm13, ymm15
|
|
vpcmpeqb k3{k5}, ymm13, [rbx]
|
|
vpcmpeqb k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vpcmpeqb k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vpcmpeqb k3{k5}, zmm24, zmm31
|
|
vpcmpeqb k3{k5}, zmm24, [rbx]
|
|
vpcmpeqb k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vpcmpeqb k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vpcmpeqw k3, xmm7, xmm0
|
|
vpcmpeqw k3, xmm7, [rbx]
|
|
vpcmpeqw k3, xmm7, [rbx+r11*8+256]
|
|
vpcmpeqw k3, xmm7, [rbx+r11*8-256]
|
|
vpcmpeqw k3, ymm13, ymm15
|
|
vpcmpeqw k3, ymm13, [rbx]
|
|
vpcmpeqw k3, ymm13, [rbx+r11*8+256]
|
|
vpcmpeqw k3, ymm13, [rbx+r11*8-256]
|
|
vpcmpeqw k3, zmm24, zmm31
|
|
vpcmpeqw k3, zmm24, [rbx]
|
|
vpcmpeqw k3, zmm24, [rbx+r11*8+256]
|
|
vpcmpeqw k3, zmm24, [rbx+r11*8-256]
|
|
vpcmpeqw k3{k5}, xmm7, xmm0
|
|
vpcmpeqw k3{k5}, xmm7, [rbx]
|
|
vpcmpeqw k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vpcmpeqw k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vpcmpeqw k3{k5}, ymm13, ymm15
|
|
vpcmpeqw k3{k5}, ymm13, [rbx]
|
|
vpcmpeqw k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vpcmpeqw k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vpcmpeqw k3{k5}, zmm24, zmm31
|
|
vpcmpeqw k3{k5}, zmm24, [rbx]
|
|
vpcmpeqw k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vpcmpeqw k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vpcmpgtb k3, xmm7, xmm0
|
|
vpcmpgtb k3, xmm7, [rbx]
|
|
vpcmpgtb k3, xmm7, [rbx+r11*8+256]
|
|
vpcmpgtb k3, xmm7, [rbx+r11*8-256]
|
|
vpcmpgtb k3, ymm13, ymm15
|
|
vpcmpgtb k3, ymm13, [rbx]
|
|
vpcmpgtb k3, ymm13, [rbx+r11*8+256]
|
|
vpcmpgtb k3, ymm13, [rbx+r11*8-256]
|
|
vpcmpgtb k3, zmm24, zmm31
|
|
vpcmpgtb k3, zmm24, [rbx]
|
|
vpcmpgtb k3, zmm24, [rbx+r11*8+256]
|
|
vpcmpgtb k3, zmm24, [rbx+r11*8-256]
|
|
vpcmpgtb k3{k5}, xmm7, xmm0
|
|
vpcmpgtb k3{k5}, xmm7, [rbx]
|
|
vpcmpgtb k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vpcmpgtb k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vpcmpgtb k3{k5}, ymm13, ymm15
|
|
vpcmpgtb k3{k5}, ymm13, [rbx]
|
|
vpcmpgtb k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vpcmpgtb k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vpcmpgtb k3{k5}, zmm24, zmm31
|
|
vpcmpgtb k3{k5}, zmm24, [rbx]
|
|
vpcmpgtb k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vpcmpgtb k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vpcmpgtw k3, xmm7, xmm0
|
|
vpcmpgtw k3, xmm7, [rbx]
|
|
vpcmpgtw k3, xmm7, [rbx+r11*8+256]
|
|
vpcmpgtw k3, xmm7, [rbx+r11*8-256]
|
|
vpcmpgtw k3, ymm13, ymm15
|
|
vpcmpgtw k3, ymm13, [rbx]
|
|
vpcmpgtw k3, ymm13, [rbx+r11*8+256]
|
|
vpcmpgtw k3, ymm13, [rbx+r11*8-256]
|
|
vpcmpgtw k3, zmm24, zmm31
|
|
vpcmpgtw k3, zmm24, [rbx]
|
|
vpcmpgtw k3, zmm24, [rbx+r11*8+256]
|
|
vpcmpgtw k3, zmm24, [rbx+r11*8-256]
|
|
vpcmpgtw k3{k5}, xmm7, xmm0
|
|
vpcmpgtw k3{k5}, xmm7, [rbx]
|
|
vpcmpgtw k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vpcmpgtw k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vpcmpgtw k3{k5}, ymm13, ymm15
|
|
vpcmpgtw k3{k5}, ymm13, [rbx]
|
|
vpcmpgtw k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vpcmpgtw k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vpcmpgtw k3{k5}, zmm24, zmm31
|
|
vpcmpgtw k3{k5}, zmm24, [rbx]
|
|
vpcmpgtw k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vpcmpgtw k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vpcmpub k3, xmm7, xmm0, 10
|
|
vpcmpub k3, xmm7, [rbx], 10
|
|
vpcmpub k3, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpub k3, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpub k3, ymm13, ymm15, 10
|
|
vpcmpub k3, ymm13, [rbx], 10
|
|
vpcmpub k3, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpub k3, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpub k3, zmm24, zmm31, 10
|
|
vpcmpub k3, zmm24, [rbx], 10
|
|
vpcmpub k3, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpub k3, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpub k3{k5}, xmm7, xmm0, 10
|
|
vpcmpub k3{k5}, xmm7, [rbx], 10
|
|
vpcmpub k3{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpub k3{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpub k3{k5}, ymm13, ymm15, 10
|
|
vpcmpub k3{k5}, ymm13, [rbx], 10
|
|
vpcmpub k3{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpub k3{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpub k3{k5}, zmm24, zmm31, 10
|
|
vpcmpub k3{k5}, zmm24, [rbx], 10
|
|
vpcmpub k3{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpub k3{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpuw k3, xmm7, xmm0, 10
|
|
vpcmpuw k3, xmm7, [rbx], 10
|
|
vpcmpuw k3, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpuw k3, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpuw k3, ymm13, ymm15, 10
|
|
vpcmpuw k3, ymm13, [rbx], 10
|
|
vpcmpuw k3, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpuw k3, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpuw k3, zmm24, zmm31, 10
|
|
vpcmpuw k3, zmm24, [rbx], 10
|
|
vpcmpuw k3, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpuw k3, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpuw k3{k5}, xmm7, xmm0, 10
|
|
vpcmpuw k3{k5}, xmm7, [rbx], 10
|
|
vpcmpuw k3{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpuw k3{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpuw k3{k5}, ymm13, ymm15, 10
|
|
vpcmpuw k3{k5}, ymm13, [rbx], 10
|
|
vpcmpuw k3{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpuw k3{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpuw k3{k5}, zmm24, zmm31, 10
|
|
vpcmpuw k3{k5}, zmm24, [rbx], 10
|
|
vpcmpuw k3{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpuw k3{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpw k3, xmm7, xmm0, 10
|
|
vpcmpw k3, xmm7, [rbx], 10
|
|
vpcmpw k3, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpw k3, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpw k3, ymm13, ymm15, 10
|
|
vpcmpw k3, ymm13, [rbx], 10
|
|
vpcmpw k3, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpw k3, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpw k3, zmm24, zmm31, 10
|
|
vpcmpw k3, zmm24, [rbx], 10
|
|
vpcmpw k3, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpw k3, zmm24, [rbx+r11*8-256], 10
|
|
vpcmpw k3{k5}, xmm7, xmm0, 10
|
|
vpcmpw k3{k5}, xmm7, [rbx], 10
|
|
vpcmpw k3{k5}, xmm7, [rbx+r11*8+256], 10
|
|
vpcmpw k3{k5}, xmm7, [rbx+r11*8-256], 10
|
|
vpcmpw k3{k5}, ymm13, ymm15, 10
|
|
vpcmpw k3{k5}, ymm13, [rbx], 10
|
|
vpcmpw k3{k5}, ymm13, [rbx+r11*8+256], 10
|
|
vpcmpw k3{k5}, ymm13, [rbx+r11*8-256], 10
|
|
vpcmpw k3{k5}, zmm24, zmm31, 10
|
|
vpcmpw k3{k5}, zmm24, [rbx], 10
|
|
vpcmpw k3{k5}, zmm24, [rbx+r11*8+256], 10
|
|
vpcmpw k3{k5}, zmm24, [rbx+r11*8-256], 10
|
|
vpermi2w xmm2, xmm7, xmm0
|
|
vpermi2w xmm2, xmm7, [rbx]
|
|
vpermi2w xmm2, xmm7, [rbx+r11*8+256]
|
|
vpermi2w xmm2, xmm7, [rbx+r11*8-256]
|
|
vpermi2w xmm2{k5}, xmm7, xmm0
|
|
vpermi2w xmm2{k5}, xmm7, [rbx]
|
|
vpermi2w xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpermi2w xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpermi2w xmm2{k5}{z}, xmm7, xmm0
|
|
vpermi2w xmm2{k5}{z}, xmm7, [rbx]
|
|
vpermi2w xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpermi2w xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpermi2w ymm16, ymm13, ymm15
|
|
vpermi2w ymm16, ymm13, [rbx]
|
|
vpermi2w ymm16, ymm13, [rbx+r11*8+256]
|
|
vpermi2w ymm16, ymm13, [rbx+r11*8-256]
|
|
vpermi2w ymm16{k5}, ymm13, ymm15
|
|
vpermi2w ymm16{k5}, ymm13, [rbx]
|
|
vpermi2w ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpermi2w ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpermi2w ymm16{k5}{z}, ymm13, ymm15
|
|
vpermi2w ymm16{k5}{z}, ymm13, [rbx]
|
|
vpermi2w ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpermi2w ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpermi2w zmm24, zmm24, zmm31
|
|
vpermi2w zmm24, zmm24, [rbx]
|
|
vpermi2w zmm24, zmm24, [rbx+r11*8+256]
|
|
vpermi2w zmm24, zmm24, [rbx+r11*8-256]
|
|
vpermi2w zmm24{k5}, zmm24, zmm31
|
|
vpermi2w zmm24{k5}, zmm24, [rbx]
|
|
vpermi2w zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpermi2w zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpermi2w zmm24{k5}{z}, zmm24, zmm31
|
|
vpermi2w zmm24{k5}{z}, zmm24, [rbx]
|
|
vpermi2w zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpermi2w zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpermt2w xmm2, xmm7, xmm0
|
|
vpermt2w xmm2, xmm7, [rbx]
|
|
vpermt2w xmm2, xmm7, [rbx+r11*8+256]
|
|
vpermt2w xmm2, xmm7, [rbx+r11*8-256]
|
|
vpermt2w xmm2{k5}, xmm7, xmm0
|
|
vpermt2w xmm2{k5}, xmm7, [rbx]
|
|
vpermt2w xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpermt2w xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpermt2w xmm2{k5}{z}, xmm7, xmm0
|
|
vpermt2w xmm2{k5}{z}, xmm7, [rbx]
|
|
vpermt2w xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpermt2w xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpermt2w ymm16, ymm13, ymm15
|
|
vpermt2w ymm16, ymm13, [rbx]
|
|
vpermt2w ymm16, ymm13, [rbx+r11*8+256]
|
|
vpermt2w ymm16, ymm13, [rbx+r11*8-256]
|
|
vpermt2w ymm16{k5}, ymm13, ymm15
|
|
vpermt2w ymm16{k5}, ymm13, [rbx]
|
|
vpermt2w ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpermt2w ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpermt2w ymm16{k5}{z}, ymm13, ymm15
|
|
vpermt2w ymm16{k5}{z}, ymm13, [rbx]
|
|
vpermt2w ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpermt2w ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpermt2w zmm24, zmm24, zmm31
|
|
vpermt2w zmm24, zmm24, [rbx]
|
|
vpermt2w zmm24, zmm24, [rbx+r11*8+256]
|
|
vpermt2w zmm24, zmm24, [rbx+r11*8-256]
|
|
vpermt2w zmm24{k5}, zmm24, zmm31
|
|
vpermt2w zmm24{k5}, zmm24, [rbx]
|
|
vpermt2w zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpermt2w zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpermt2w zmm24{k5}{z}, zmm24, zmm31
|
|
vpermt2w zmm24{k5}{z}, zmm24, [rbx]
|
|
vpermt2w zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpermt2w zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpermw xmm2, xmm7, xmm0
|
|
vpermw xmm2, xmm7, [rbx]
|
|
vpermw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpermw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpermw xmm2{k5}, xmm7, xmm0
|
|
vpermw xmm2{k5}, xmm7, [rbx]
|
|
vpermw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpermw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpermw xmm2{k5}{z}, xmm7, xmm0
|
|
vpermw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpermw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpermw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpermw ymm16, ymm13, ymm15
|
|
vpermw ymm16, ymm13, [rbx]
|
|
vpermw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpermw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpermw ymm16{k5}, ymm13, ymm15
|
|
vpermw ymm16{k5}, ymm13, [rbx]
|
|
vpermw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpermw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpermw ymm16{k5}{z}, ymm13, ymm15
|
|
vpermw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpermw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpermw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpermw zmm24, zmm24, zmm31
|
|
vpermw zmm24, zmm24, [rbx]
|
|
vpermw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpermw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpermw zmm24{k5}, zmm24, zmm31
|
|
vpermw zmm24{k5}, zmm24, [rbx]
|
|
vpermw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpermw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpermw zmm24{k5}{z}, zmm24, zmm31
|
|
vpermw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpermw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpermw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpextrb [rbx], xmm2, 10
|
|
vpextrb [rbx+rsi*8+256], xmm2, 10
|
|
vpextrb [rbx+rsi*8-256], xmm2, 10
|
|
vpextrb cl, xmm2, 10
|
|
vpextrb cx, xmm2, 10
|
|
vpextrb ecx, xmm2, 10
|
|
vpextrb rcx, xmm2, 10
|
|
vpextrw cx, xmm0, 10
|
|
vpextrw ecx, xmm0, 10
|
|
vpextrw rcx, xmm0, 10
|
|
vpextrw [rbx], xmm2, 10
|
|
vpextrw [rbx+rsi*8+256], xmm2, 10
|
|
vpextrw [rbx+rsi*8-256], xmm2, 10
|
|
vpextrw cx, xmm2, 10
|
|
vpextrw ecx, xmm2, 10
|
|
vpextrw rcx, xmm2, 10
|
|
vpinsrb xmm2, xmm7, [rbx], 10
|
|
vpinsrb xmm2, xmm7, [rbx+rsi*8+256], 10
|
|
vpinsrb xmm2, xmm7, [rbx+rsi*8-256], 10
|
|
vpinsrb xmm2, xmm7, cl, 10
|
|
vpinsrb xmm2, xmm7, ecx, 10
|
|
vpinsrw xmm2, xmm7, [rbx], 10
|
|
vpinsrw xmm2, xmm7, [rbx+rsi*8+256], 10
|
|
vpinsrw xmm2, xmm7, [rbx+rsi*8-256], 10
|
|
vpinsrw xmm2, xmm7, cx, 10
|
|
vpinsrw xmm2, xmm7, ecx, 10
|
|
vpmaddubsw xmm2, xmm7, xmm0
|
|
vpmaddubsw xmm2, xmm7, [rbx]
|
|
vpmaddubsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaddubsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaddubsw xmm2{k5}, xmm7, xmm0
|
|
vpmaddubsw xmm2{k5}, xmm7, [rbx]
|
|
vpmaddubsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaddubsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaddubsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaddubsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaddubsw ymm16, ymm13, ymm15
|
|
vpmaddubsw ymm16, ymm13, [rbx]
|
|
vpmaddubsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaddubsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaddubsw ymm16{k5}, ymm13, ymm15
|
|
vpmaddubsw ymm16{k5}, ymm13, [rbx]
|
|
vpmaddubsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaddubsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaddubsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaddubsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaddubsw zmm24, zmm24, zmm31
|
|
vpmaddubsw zmm24, zmm24, [rbx]
|
|
vpmaddubsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaddubsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaddubsw zmm24{k5}, zmm24, zmm31
|
|
vpmaddubsw zmm24{k5}, zmm24, [rbx]
|
|
vpmaddubsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaddubsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaddubsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaddubsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmaddwd xmm2, xmm7, xmm0
|
|
vpmaddwd xmm2, xmm7, [rbx]
|
|
vpmaddwd xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaddwd xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaddwd xmm2{k5}, xmm7, xmm0
|
|
vpmaddwd xmm2{k5}, xmm7, [rbx]
|
|
vpmaddwd xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaddwd xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaddwd xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaddwd xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaddwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaddwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaddwd ymm16, ymm13, ymm15
|
|
vpmaddwd ymm16, ymm13, [rbx]
|
|
vpmaddwd ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaddwd ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaddwd ymm16{k5}, ymm13, ymm15
|
|
vpmaddwd ymm16{k5}, ymm13, [rbx]
|
|
vpmaddwd ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaddwd ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaddwd ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaddwd ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaddwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaddwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaddwd zmm24, zmm24, zmm31
|
|
vpmaddwd zmm24, zmm24, [rbx]
|
|
vpmaddwd zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaddwd zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaddwd zmm24{k5}, zmm24, zmm31
|
|
vpmaddwd zmm24{k5}, zmm24, [rbx]
|
|
vpmaddwd zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaddwd zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaddwd zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaddwd zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaddwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaddwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmaxsb xmm2, xmm7, xmm0
|
|
vpmaxsb xmm2, xmm7, [rbx]
|
|
vpmaxsb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaxsb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaxsb xmm2{k5}, xmm7, xmm0
|
|
vpmaxsb xmm2{k5}, xmm7, [rbx]
|
|
vpmaxsb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaxsb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaxsb xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaxsb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaxsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaxsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaxsb ymm16, ymm13, ymm15
|
|
vpmaxsb ymm16, ymm13, [rbx]
|
|
vpmaxsb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaxsb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaxsb ymm16{k5}, ymm13, ymm15
|
|
vpmaxsb ymm16{k5}, ymm13, [rbx]
|
|
vpmaxsb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaxsb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaxsb ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaxsb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaxsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaxsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaxsb zmm24, zmm24, zmm31
|
|
vpmaxsb zmm24, zmm24, [rbx]
|
|
vpmaxsb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaxsb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaxsb zmm24{k5}, zmm24, zmm31
|
|
vpmaxsb zmm24{k5}, zmm24, [rbx]
|
|
vpmaxsb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaxsb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaxsb zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaxsb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaxsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaxsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmaxsw xmm2, xmm7, xmm0
|
|
vpmaxsw xmm2, xmm7, [rbx]
|
|
vpmaxsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaxsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaxsw xmm2{k5}, xmm7, xmm0
|
|
vpmaxsw xmm2{k5}, xmm7, [rbx]
|
|
vpmaxsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaxsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaxsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaxsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaxsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaxsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaxsw ymm16, ymm13, ymm15
|
|
vpmaxsw ymm16, ymm13, [rbx]
|
|
vpmaxsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaxsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaxsw ymm16{k5}, ymm13, ymm15
|
|
vpmaxsw ymm16{k5}, ymm13, [rbx]
|
|
vpmaxsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaxsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaxsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaxsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaxsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaxsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaxsw zmm24, zmm24, zmm31
|
|
vpmaxsw zmm24, zmm24, [rbx]
|
|
vpmaxsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaxsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaxsw zmm24{k5}, zmm24, zmm31
|
|
vpmaxsw zmm24{k5}, zmm24, [rbx]
|
|
vpmaxsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaxsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaxsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaxsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaxsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaxsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmaxub xmm2, xmm7, xmm0
|
|
vpmaxub xmm2, xmm7, [rbx]
|
|
vpmaxub xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaxub xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaxub xmm2{k5}, xmm7, xmm0
|
|
vpmaxub xmm2{k5}, xmm7, [rbx]
|
|
vpmaxub xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaxub xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaxub xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaxub xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaxub xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaxub xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaxub ymm16, ymm13, ymm15
|
|
vpmaxub ymm16, ymm13, [rbx]
|
|
vpmaxub ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaxub ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaxub ymm16{k5}, ymm13, ymm15
|
|
vpmaxub ymm16{k5}, ymm13, [rbx]
|
|
vpmaxub ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaxub ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaxub ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaxub ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaxub ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaxub ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaxub zmm24, zmm24, zmm31
|
|
vpmaxub zmm24, zmm24, [rbx]
|
|
vpmaxub zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaxub zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaxub zmm24{k5}, zmm24, zmm31
|
|
vpmaxub zmm24{k5}, zmm24, [rbx]
|
|
vpmaxub zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaxub zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaxub zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaxub zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaxub zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaxub zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmaxuw xmm2, xmm7, xmm0
|
|
vpmaxuw xmm2, xmm7, [rbx]
|
|
vpmaxuw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmaxuw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmaxuw xmm2{k5}, xmm7, xmm0
|
|
vpmaxuw xmm2{k5}, xmm7, [rbx]
|
|
vpmaxuw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmaxuw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmaxuw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmaxuw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmaxuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmaxuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmaxuw ymm16, ymm13, ymm15
|
|
vpmaxuw ymm16, ymm13, [rbx]
|
|
vpmaxuw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmaxuw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmaxuw ymm16{k5}, ymm13, ymm15
|
|
vpmaxuw ymm16{k5}, ymm13, [rbx]
|
|
vpmaxuw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmaxuw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmaxuw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmaxuw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmaxuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmaxuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmaxuw zmm24, zmm24, zmm31
|
|
vpmaxuw zmm24, zmm24, [rbx]
|
|
vpmaxuw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmaxuw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmaxuw zmm24{k5}, zmm24, zmm31
|
|
vpmaxuw zmm24{k5}, zmm24, [rbx]
|
|
vpmaxuw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmaxuw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmaxuw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmaxuw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmaxuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmaxuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpminsb xmm2, xmm7, xmm0
|
|
vpminsb xmm2, xmm7, [rbx]
|
|
vpminsb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpminsb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpminsb xmm2{k5}, xmm7, xmm0
|
|
vpminsb xmm2{k5}, xmm7, [rbx]
|
|
vpminsb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpminsb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpminsb xmm2{k5}{z}, xmm7, xmm0
|
|
vpminsb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpminsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpminsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpminsb ymm16, ymm13, ymm15
|
|
vpminsb ymm16, ymm13, [rbx]
|
|
vpminsb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpminsb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpminsb ymm16{k5}, ymm13, ymm15
|
|
vpminsb ymm16{k5}, ymm13, [rbx]
|
|
vpminsb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpminsb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpminsb ymm16{k5}{z}, ymm13, ymm15
|
|
vpminsb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpminsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpminsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpminsb zmm24, zmm24, zmm31
|
|
vpminsb zmm24, zmm24, [rbx]
|
|
vpminsb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpminsb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpminsb zmm24{k5}, zmm24, zmm31
|
|
vpminsb zmm24{k5}, zmm24, [rbx]
|
|
vpminsb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpminsb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpminsb zmm24{k5}{z}, zmm24, zmm31
|
|
vpminsb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpminsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpminsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpminsw xmm2, xmm7, xmm0
|
|
vpminsw xmm2, xmm7, [rbx]
|
|
vpminsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpminsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpminsw xmm2{k5}, xmm7, xmm0
|
|
vpminsw xmm2{k5}, xmm7, [rbx]
|
|
vpminsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpminsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpminsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpminsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpminsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpminsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpminsw ymm16, ymm13, ymm15
|
|
vpminsw ymm16, ymm13, [rbx]
|
|
vpminsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpminsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpminsw ymm16{k5}, ymm13, ymm15
|
|
vpminsw ymm16{k5}, ymm13, [rbx]
|
|
vpminsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpminsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpminsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpminsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpminsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpminsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpminsw zmm24, zmm24, zmm31
|
|
vpminsw zmm24, zmm24, [rbx]
|
|
vpminsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpminsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpminsw zmm24{k5}, zmm24, zmm31
|
|
vpminsw zmm24{k5}, zmm24, [rbx]
|
|
vpminsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpminsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpminsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpminsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpminsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpminsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpminub xmm2, xmm7, xmm0
|
|
vpminub xmm2, xmm7, [rbx]
|
|
vpminub xmm2, xmm7, [rbx+r11*8+256]
|
|
vpminub xmm2, xmm7, [rbx+r11*8-256]
|
|
vpminub xmm2{k5}, xmm7, xmm0
|
|
vpminub xmm2{k5}, xmm7, [rbx]
|
|
vpminub xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpminub xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpminub xmm2{k5}{z}, xmm7, xmm0
|
|
vpminub xmm2{k5}{z}, xmm7, [rbx]
|
|
vpminub xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpminub xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpminub ymm16, ymm13, ymm15
|
|
vpminub ymm16, ymm13, [rbx]
|
|
vpminub ymm16, ymm13, [rbx+r11*8+256]
|
|
vpminub ymm16, ymm13, [rbx+r11*8-256]
|
|
vpminub ymm16{k5}, ymm13, ymm15
|
|
vpminub ymm16{k5}, ymm13, [rbx]
|
|
vpminub ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpminub ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpminub ymm16{k5}{z}, ymm13, ymm15
|
|
vpminub ymm16{k5}{z}, ymm13, [rbx]
|
|
vpminub ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpminub ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpminub zmm24, zmm24, zmm31
|
|
vpminub zmm24, zmm24, [rbx]
|
|
vpminub zmm24, zmm24, [rbx+r11*8+256]
|
|
vpminub zmm24, zmm24, [rbx+r11*8-256]
|
|
vpminub zmm24{k5}, zmm24, zmm31
|
|
vpminub zmm24{k5}, zmm24, [rbx]
|
|
vpminub zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpminub zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpminub zmm24{k5}{z}, zmm24, zmm31
|
|
vpminub zmm24{k5}{z}, zmm24, [rbx]
|
|
vpminub zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpminub zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpminuw xmm2, xmm7, xmm0
|
|
vpminuw xmm2, xmm7, [rbx]
|
|
vpminuw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpminuw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpminuw xmm2{k5}, xmm7, xmm0
|
|
vpminuw xmm2{k5}, xmm7, [rbx]
|
|
vpminuw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpminuw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpminuw xmm2{k5}{z}, xmm7, xmm0
|
|
vpminuw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpminuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpminuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpminuw ymm16, ymm13, ymm15
|
|
vpminuw ymm16, ymm13, [rbx]
|
|
vpminuw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpminuw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpminuw ymm16{k5}, ymm13, ymm15
|
|
vpminuw ymm16{k5}, ymm13, [rbx]
|
|
vpminuw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpminuw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpminuw ymm16{k5}{z}, ymm13, ymm15
|
|
vpminuw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpminuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpminuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpminuw zmm24, zmm24, zmm31
|
|
vpminuw zmm24, zmm24, [rbx]
|
|
vpminuw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpminuw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpminuw zmm24{k5}, zmm24, zmm31
|
|
vpminuw zmm24{k5}, zmm24, [rbx]
|
|
vpminuw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpminuw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpminuw zmm24{k5}{z}, zmm24, zmm31
|
|
vpminuw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpminuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpminuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmovb2m k3, xmm0
|
|
vpmovb2m k3, ymm15
|
|
vpmovb2m k3, zmm31
|
|
vpmovm2b xmm2, k1
|
|
vpmovm2b ymm16, k1
|
|
vpmovm2b zmm24, k1
|
|
vpmovm2w xmm2, k1
|
|
vpmovm2w ymm16, k1
|
|
vpmovm2w zmm24, k1
|
|
vpmovswb xmm0, xmm2
|
|
vpmovswb xmm0, ymm16
|
|
vpmovswb ymm15, zmm24
|
|
vpmovswb [rbx], xmm2
|
|
vpmovswb [rbx], ymm16
|
|
vpmovswb [rbx], zmm24
|
|
vpmovswb [rbx+r11*8+256], xmm2
|
|
vpmovswb [rbx+r11*8+256], ymm16
|
|
vpmovswb [rbx+r11*8+256], zmm24
|
|
vpmovswb [rbx+r11*8-256], xmm2
|
|
vpmovswb [rbx+r11*8-256], ymm16
|
|
vpmovswb [rbx+r11*8-256], zmm24
|
|
vpmovsxbw xmm2, xmm0
|
|
vpmovsxbw xmm2, [rbx]
|
|
vpmovsxbw xmm2, [rbx+r11*8+256]
|
|
vpmovsxbw xmm2, [rbx+r11*8-256]
|
|
vpmovsxbw xmm2{k5}, xmm0
|
|
vpmovsxbw xmm2{k5}, [rbx]
|
|
vpmovsxbw xmm2{k5}, [rbx+r11*8+256]
|
|
vpmovsxbw xmm2{k5}, [rbx+r11*8-256]
|
|
vpmovsxbw xmm2{k5}{z}, xmm0
|
|
vpmovsxbw xmm2{k5}{z}, [rbx]
|
|
vpmovsxbw xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpmovsxbw xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpmovsxbw ymm16, xmm0
|
|
vpmovsxbw ymm16, [rbx]
|
|
vpmovsxbw ymm16, [rbx+r11*8+256]
|
|
vpmovsxbw ymm16, [rbx+r11*8-256]
|
|
vpmovsxbw ymm16{k5}, xmm0
|
|
vpmovsxbw ymm16{k5}, [rbx]
|
|
vpmovsxbw ymm16{k5}, [rbx+r11*8+256]
|
|
vpmovsxbw ymm16{k5}, [rbx+r11*8-256]
|
|
vpmovsxbw ymm16{k5}{z}, xmm0
|
|
vpmovsxbw ymm16{k5}{z}, [rbx]
|
|
vpmovsxbw ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpmovsxbw ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpmovsxbw zmm24, ymm15
|
|
vpmovsxbw zmm24, [rbx]
|
|
vpmovsxbw zmm24, [rbx+r11*8+256]
|
|
vpmovsxbw zmm24, [rbx+r11*8-256]
|
|
vpmovsxbw zmm24{k5}, ymm15
|
|
vpmovsxbw zmm24{k5}, [rbx]
|
|
vpmovsxbw zmm24{k5}, [rbx+r11*8+256]
|
|
vpmovsxbw zmm24{k5}, [rbx+r11*8-256]
|
|
vpmovsxbw zmm24{k5}{z}, ymm15
|
|
vpmovsxbw zmm24{k5}{z}, [rbx]
|
|
vpmovsxbw zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpmovsxbw zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpmovuswb xmm0, xmm2
|
|
vpmovuswb xmm0, ymm16
|
|
vpmovuswb ymm15, zmm24
|
|
vpmovuswb [rbx], xmm2
|
|
vpmovuswb [rbx], ymm16
|
|
vpmovuswb [rbx], zmm24
|
|
vpmovuswb [rbx+r11*8+256], xmm2
|
|
vpmovuswb [rbx+r11*8+256], ymm16
|
|
vpmovuswb [rbx+r11*8+256], zmm24
|
|
vpmovuswb [rbx+r11*8-256], xmm2
|
|
vpmovuswb [rbx+r11*8-256], ymm16
|
|
vpmovuswb [rbx+r11*8-256], zmm24
|
|
vpmovw2m k3, xmm0
|
|
vpmovw2m k3, ymm15
|
|
vpmovw2m k3, zmm31
|
|
vpmovwb xmm0, xmm2
|
|
vpmovwb xmm0, ymm16
|
|
vpmovwb ymm15, zmm24
|
|
vpmovwb [rbx], xmm2
|
|
vpmovwb [rbx], ymm16
|
|
vpmovwb [rbx], zmm24
|
|
vpmovwb [rbx+r11*8+256], xmm2
|
|
vpmovwb [rbx+r11*8+256], ymm16
|
|
vpmovwb [rbx+r11*8+256], zmm24
|
|
vpmovwb [rbx+r11*8-256], xmm2
|
|
vpmovwb [rbx+r11*8-256], ymm16
|
|
vpmovwb [rbx+r11*8-256], zmm24
|
|
vpmovzxbw xmm2, xmm0
|
|
vpmovzxbw xmm2, [rbx]
|
|
vpmovzxbw xmm2, [rbx+r11*8+256]
|
|
vpmovzxbw xmm2, [rbx+r11*8-256]
|
|
vpmovzxbw xmm2{k5}, xmm0
|
|
vpmovzxbw xmm2{k5}, [rbx]
|
|
vpmovzxbw xmm2{k5}, [rbx+r11*8+256]
|
|
vpmovzxbw xmm2{k5}, [rbx+r11*8-256]
|
|
vpmovzxbw xmm2{k5}{z}, xmm0
|
|
vpmovzxbw xmm2{k5}{z}, [rbx]
|
|
vpmovzxbw xmm2{k5}{z}, [rbx+r11*8+256]
|
|
vpmovzxbw xmm2{k5}{z}, [rbx+r11*8-256]
|
|
vpmovzxbw ymm16, xmm0
|
|
vpmovzxbw ymm16, [rbx]
|
|
vpmovzxbw ymm16, [rbx+r11*8+256]
|
|
vpmovzxbw ymm16, [rbx+r11*8-256]
|
|
vpmovzxbw ymm16{k5}, xmm0
|
|
vpmovzxbw ymm16{k5}, [rbx]
|
|
vpmovzxbw ymm16{k5}, [rbx+r11*8+256]
|
|
vpmovzxbw ymm16{k5}, [rbx+r11*8-256]
|
|
vpmovzxbw ymm16{k5}{z}, xmm0
|
|
vpmovzxbw ymm16{k5}{z}, [rbx]
|
|
vpmovzxbw ymm16{k5}{z}, [rbx+r11*8+256]
|
|
vpmovzxbw ymm16{k5}{z}, [rbx+r11*8-256]
|
|
vpmovzxbw zmm24, ymm15
|
|
vpmovzxbw zmm24, [rbx]
|
|
vpmovzxbw zmm24, [rbx+r11*8+256]
|
|
vpmovzxbw zmm24, [rbx+r11*8-256]
|
|
vpmovzxbw zmm24{k5}, ymm15
|
|
vpmovzxbw zmm24{k5}, [rbx]
|
|
vpmovzxbw zmm24{k5}, [rbx+r11*8+256]
|
|
vpmovzxbw zmm24{k5}, [rbx+r11*8-256]
|
|
vpmovzxbw zmm24{k5}{z}, ymm15
|
|
vpmovzxbw zmm24{k5}{z}, [rbx]
|
|
vpmovzxbw zmm24{k5}{z}, [rbx+r11*8+256]
|
|
vpmovzxbw zmm24{k5}{z}, [rbx+r11*8-256]
|
|
vpmulhrsw xmm2, xmm7, xmm0
|
|
vpmulhrsw xmm2, xmm7, [rbx]
|
|
vpmulhrsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmulhrsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmulhrsw xmm2{k5}, xmm7, xmm0
|
|
vpmulhrsw xmm2{k5}, xmm7, [rbx]
|
|
vpmulhrsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmulhrsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmulhrsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmulhrsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmulhrsw ymm16, ymm13, ymm15
|
|
vpmulhrsw ymm16, ymm13, [rbx]
|
|
vpmulhrsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmulhrsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmulhrsw ymm16{k5}, ymm13, ymm15
|
|
vpmulhrsw ymm16{k5}, ymm13, [rbx]
|
|
vpmulhrsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmulhrsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmulhrsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmulhrsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmulhrsw zmm24, zmm24, zmm31
|
|
vpmulhrsw zmm24, zmm24, [rbx]
|
|
vpmulhrsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmulhrsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmulhrsw zmm24{k5}, zmm24, zmm31
|
|
vpmulhrsw zmm24{k5}, zmm24, [rbx]
|
|
vpmulhrsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmulhrsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmulhrsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmulhrsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmulhuw xmm2, xmm7, xmm0
|
|
vpmulhuw xmm2, xmm7, [rbx]
|
|
vpmulhuw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmulhuw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmulhuw xmm2{k5}, xmm7, xmm0
|
|
vpmulhuw xmm2{k5}, xmm7, [rbx]
|
|
vpmulhuw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmulhuw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmulhuw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmulhuw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmulhuw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmulhuw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmulhuw ymm16, ymm13, ymm15
|
|
vpmulhuw ymm16, ymm13, [rbx]
|
|
vpmulhuw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmulhuw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmulhuw ymm16{k5}, ymm13, ymm15
|
|
vpmulhuw ymm16{k5}, ymm13, [rbx]
|
|
vpmulhuw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmulhuw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmulhuw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmulhuw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmulhuw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmulhuw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmulhuw zmm24, zmm24, zmm31
|
|
vpmulhuw zmm24, zmm24, [rbx]
|
|
vpmulhuw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmulhuw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmulhuw zmm24{k5}, zmm24, zmm31
|
|
vpmulhuw zmm24{k5}, zmm24, [rbx]
|
|
vpmulhuw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmulhuw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmulhuw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmulhuw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmulhuw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmulhuw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmulhw xmm2, xmm7, xmm0
|
|
vpmulhw xmm2, xmm7, [rbx]
|
|
vpmulhw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmulhw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmulhw xmm2{k5}, xmm7, xmm0
|
|
vpmulhw xmm2{k5}, xmm7, [rbx]
|
|
vpmulhw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmulhw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmulhw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmulhw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmulhw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmulhw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmulhw ymm16, ymm13, ymm15
|
|
vpmulhw ymm16, ymm13, [rbx]
|
|
vpmulhw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmulhw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmulhw ymm16{k5}, ymm13, ymm15
|
|
vpmulhw ymm16{k5}, ymm13, [rbx]
|
|
vpmulhw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmulhw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmulhw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmulhw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmulhw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmulhw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmulhw zmm24, zmm24, zmm31
|
|
vpmulhw zmm24, zmm24, [rbx]
|
|
vpmulhw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmulhw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmulhw zmm24{k5}, zmm24, zmm31
|
|
vpmulhw zmm24{k5}, zmm24, [rbx]
|
|
vpmulhw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmulhw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmulhw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmulhw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmulhw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmulhw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpmullw xmm2, xmm7, xmm0
|
|
vpmullw xmm2, xmm7, [rbx]
|
|
vpmullw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpmullw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpmullw xmm2{k5}, xmm7, xmm0
|
|
vpmullw xmm2{k5}, xmm7, [rbx]
|
|
vpmullw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpmullw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpmullw xmm2{k5}{z}, xmm7, xmm0
|
|
vpmullw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpmullw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpmullw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpmullw ymm16, ymm13, ymm15
|
|
vpmullw ymm16, ymm13, [rbx]
|
|
vpmullw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpmullw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpmullw ymm16{k5}, ymm13, ymm15
|
|
vpmullw ymm16{k5}, ymm13, [rbx]
|
|
vpmullw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpmullw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpmullw ymm16{k5}{z}, ymm13, ymm15
|
|
vpmullw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpmullw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpmullw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpmullw zmm24, zmm24, zmm31
|
|
vpmullw zmm24, zmm24, [rbx]
|
|
vpmullw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpmullw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpmullw zmm24{k5}, zmm24, zmm31
|
|
vpmullw zmm24{k5}, zmm24, [rbx]
|
|
vpmullw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpmullw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpmullw zmm24{k5}{z}, zmm24, zmm31
|
|
vpmullw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpmullw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpmullw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsadbw xmm2, xmm7, xmm0
|
|
vpsadbw xmm2, xmm7, [rbx]
|
|
vpsadbw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsadbw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsadbw ymm16, ymm13, ymm15
|
|
vpsadbw ymm16, ymm13, [rbx]
|
|
vpsadbw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsadbw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsadbw zmm24, zmm24, zmm31
|
|
vpsadbw zmm24, zmm24, [rbx]
|
|
vpsadbw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsadbw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpshufb xmm2, xmm7, xmm0
|
|
vpshufb xmm2, xmm7, [rbx]
|
|
vpshufb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpshufb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpshufb xmm2{k5}, xmm7, xmm0
|
|
vpshufb xmm2{k5}, xmm7, [rbx]
|
|
vpshufb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpshufb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpshufb xmm2{k5}{z}, xmm7, xmm0
|
|
vpshufb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpshufb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpshufb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpshufb ymm16, ymm13, ymm15
|
|
vpshufb ymm16, ymm13, [rbx]
|
|
vpshufb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpshufb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpshufb ymm16{k5}, ymm13, ymm15
|
|
vpshufb ymm16{k5}, ymm13, [rbx]
|
|
vpshufb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpshufb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpshufb ymm16{k5}{z}, ymm13, ymm15
|
|
vpshufb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpshufb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpshufb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpshufb zmm24, zmm24, zmm31
|
|
vpshufb zmm24, zmm24, [rbx]
|
|
vpshufb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpshufb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpshufb zmm24{k5}, zmm24, zmm31
|
|
vpshufb zmm24{k5}, zmm24, [rbx]
|
|
vpshufb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpshufb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpshufb zmm24{k5}{z}, zmm24, zmm31
|
|
vpshufb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpshufb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpshufb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpshufhw xmm2, xmm0, 10
|
|
vpshufhw xmm2, [rbx], 10
|
|
vpshufhw xmm2, [rbx+r11*8+256], 10
|
|
vpshufhw xmm2, [rbx+r11*8-256], 10
|
|
vpshufhw xmm2{k5}, xmm0, 10
|
|
vpshufhw xmm2{k5}, [rbx], 10
|
|
vpshufhw xmm2{k5}, [rbx+r11*8+256], 10
|
|
vpshufhw xmm2{k5}, [rbx+r11*8-256], 10
|
|
vpshufhw xmm2{k5}{z}, xmm0, 10
|
|
vpshufhw xmm2{k5}{z}, [rbx], 10
|
|
vpshufhw xmm2{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshufhw xmm2{k5}{z}, [rbx+r11*8-256], 10
|
|
vpshufhw ymm16, ymm15, 10
|
|
vpshufhw ymm16, [rbx], 10
|
|
vpshufhw ymm16, [rbx+r11*8+256], 10
|
|
vpshufhw ymm16, [rbx+r11*8-256], 10
|
|
vpshufhw ymm16{k5}, ymm15, 10
|
|
vpshufhw ymm16{k5}, [rbx], 10
|
|
vpshufhw ymm16{k5}, [rbx+r11*8+256], 10
|
|
vpshufhw ymm16{k5}, [rbx+r11*8-256], 10
|
|
vpshufhw ymm16{k5}{z}, ymm15, 10
|
|
vpshufhw ymm16{k5}{z}, [rbx], 10
|
|
vpshufhw ymm16{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshufhw ymm16{k5}{z}, [rbx+r11*8-256], 10
|
|
vpshufhw zmm24, zmm31, 10
|
|
vpshufhw zmm24, [rbx], 10
|
|
vpshufhw zmm24, [rbx+r11*8+256], 10
|
|
vpshufhw zmm24, [rbx+r11*8-256], 10
|
|
vpshufhw zmm24{k5}, zmm31, 10
|
|
vpshufhw zmm24{k5}, [rbx], 10
|
|
vpshufhw zmm24{k5}, [rbx+r11*8+256], 10
|
|
vpshufhw zmm24{k5}, [rbx+r11*8-256], 10
|
|
vpshufhw zmm24{k5}{z}, zmm31, 10
|
|
vpshufhw zmm24{k5}{z}, [rbx], 10
|
|
vpshufhw zmm24{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshufhw zmm24{k5}{z}, [rbx+r11*8-256], 10
|
|
vpshuflw xmm2, xmm0, 10
|
|
vpshuflw xmm2, [rbx], 10
|
|
vpshuflw xmm2, [rbx+r11*8+256], 10
|
|
vpshuflw xmm2, [rbx+r11*8-256], 10
|
|
vpshuflw xmm2{k5}, xmm0, 10
|
|
vpshuflw xmm2{k5}, [rbx], 10
|
|
vpshuflw xmm2{k5}, [rbx+r11*8+256], 10
|
|
vpshuflw xmm2{k5}, [rbx+r11*8-256], 10
|
|
vpshuflw xmm2{k5}{z}, xmm0, 10
|
|
vpshuflw xmm2{k5}{z}, [rbx], 10
|
|
vpshuflw xmm2{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshuflw xmm2{k5}{z}, [rbx+r11*8-256], 10
|
|
vpshuflw ymm16, ymm15, 10
|
|
vpshuflw ymm16, [rbx], 10
|
|
vpshuflw ymm16, [rbx+r11*8+256], 10
|
|
vpshuflw ymm16, [rbx+r11*8-256], 10
|
|
vpshuflw ymm16{k5}, ymm15, 10
|
|
vpshuflw ymm16{k5}, [rbx], 10
|
|
vpshuflw ymm16{k5}, [rbx+r11*8+256], 10
|
|
vpshuflw ymm16{k5}, [rbx+r11*8-256], 10
|
|
vpshuflw ymm16{k5}{z}, ymm15, 10
|
|
vpshuflw ymm16{k5}{z}, [rbx], 10
|
|
vpshuflw ymm16{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshuflw ymm16{k5}{z}, [rbx+r11*8-256], 10
|
|
vpshuflw zmm24, zmm31, 10
|
|
vpshuflw zmm24, [rbx], 10
|
|
vpshuflw zmm24, [rbx+r11*8+256], 10
|
|
vpshuflw zmm24, [rbx+r11*8-256], 10
|
|
vpshuflw zmm24{k5}, zmm31, 10
|
|
vpshuflw zmm24{k5}, [rbx], 10
|
|
vpshuflw zmm24{k5}, [rbx+r11*8+256], 10
|
|
vpshuflw zmm24{k5}, [rbx+r11*8-256], 10
|
|
vpshuflw zmm24{k5}{z}, zmm31, 10
|
|
vpshuflw zmm24{k5}{z}, [rbx], 10
|
|
vpshuflw zmm24{k5}{z}, [rbx+r11*8+256], 10
|
|
vpshuflw zmm24{k5}{z}, [rbx+r11*8-256], 10
|
|
vpslldq xmm7, xmm0, 10
|
|
vpslldq xmm7, [rbx], 10
|
|
vpslldq xmm7, [rbx+r11*8+256], 10
|
|
vpslldq xmm7, [rbx+r11*8-256], 10
|
|
vpslldq ymm13, ymm15, 10
|
|
vpslldq ymm13, [rbx], 10
|
|
vpslldq ymm13, [rbx+r11*8+256], 10
|
|
vpslldq ymm13, [rbx+r11*8-256], 10
|
|
vpslldq zmm24, zmm31, 10
|
|
vpslldq zmm24, [rbx], 10
|
|
vpslldq zmm24, [rbx+r11*8+256], 10
|
|
vpslldq zmm24, [rbx+r11*8-256], 10
|
|
vpsllvw xmm2, xmm7, xmm0
|
|
vpsllvw xmm2, xmm7, [rbx]
|
|
vpsllvw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsllvw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsllvw xmm2{k5}, xmm7, xmm0
|
|
vpsllvw xmm2{k5}, xmm7, [rbx]
|
|
vpsllvw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsllvw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsllvw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsllvw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsllvw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsllvw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsllvw ymm16, ymm13, ymm15
|
|
vpsllvw ymm16, ymm13, [rbx]
|
|
vpsllvw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsllvw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsllvw ymm16{k5}, ymm13, ymm15
|
|
vpsllvw ymm16{k5}, ymm13, [rbx]
|
|
vpsllvw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsllvw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsllvw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsllvw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsllvw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsllvw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsllvw zmm24, zmm24, zmm31
|
|
vpsllvw zmm24, zmm24, [rbx]
|
|
vpsllvw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsllvw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsllvw zmm24{k5}, zmm24, zmm31
|
|
vpsllvw zmm24{k5}, zmm24, [rbx]
|
|
vpsllvw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsllvw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsllvw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsllvw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsllvw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsllvw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsllw xmm7, xmm0, 10
|
|
vpsllw xmm7, [rbx], 10
|
|
vpsllw xmm7, [rbx+r11*8+256], 10
|
|
vpsllw xmm7, [rbx+r11*8-256], 10
|
|
vpsllw ymm13, ymm15, 10
|
|
vpsllw ymm13, [rbx], 10
|
|
vpsllw ymm13, [rbx+r11*8+256], 10
|
|
vpsllw ymm13, [rbx+r11*8-256], 10
|
|
vpsllw zmm24, zmm31, 10
|
|
vpsllw zmm24, [rbx], 10
|
|
vpsllw zmm24, [rbx+r11*8+256], 10
|
|
vpsllw zmm24, [rbx+r11*8-256], 10
|
|
vpsllw xmm2, xmm7, xmm0
|
|
vpsllw xmm2, xmm7, [rbx]
|
|
vpsllw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsllw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsllw xmm2{k5}, xmm7, xmm0
|
|
vpsllw xmm2{k5}, xmm7, [rbx]
|
|
vpsllw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsllw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsllw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsllw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsllw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsllw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsllw ymm16, ymm13, xmm0
|
|
vpsllw ymm16, ymm13, [rbx]
|
|
vpsllw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsllw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsllw ymm16{k5}, ymm13, xmm0
|
|
vpsllw ymm16{k5}, ymm13, [rbx]
|
|
vpsllw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsllw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsllw ymm16{k5}{z}, ymm13, xmm0
|
|
vpsllw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsllw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsllw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsllw zmm24, zmm24, xmm0
|
|
vpsllw zmm24, zmm24, [rbx]
|
|
vpsllw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsllw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsllw zmm24{k5}, zmm24, xmm0
|
|
vpsllw zmm24{k5}, zmm24, [rbx]
|
|
vpsllw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsllw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsllw zmm24{k5}{z}, zmm24, xmm0
|
|
vpsllw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsllw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsllw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsravw xmm2, xmm7, xmm0
|
|
vpsravw xmm2, xmm7, [rbx]
|
|
vpsravw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsravw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsravw xmm2{k5}, xmm7, xmm0
|
|
vpsravw xmm2{k5}, xmm7, [rbx]
|
|
vpsravw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsravw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsravw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsravw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsravw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsravw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsravw ymm16, ymm13, ymm15
|
|
vpsravw ymm16, ymm13, [rbx]
|
|
vpsravw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsravw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsravw ymm16{k5}, ymm13, ymm15
|
|
vpsravw ymm16{k5}, ymm13, [rbx]
|
|
vpsravw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsravw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsravw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsravw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsravw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsravw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsravw zmm24, zmm24, zmm31
|
|
vpsravw zmm24, zmm24, [rbx]
|
|
vpsravw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsravw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsravw zmm24{k5}, zmm24, zmm31
|
|
vpsravw zmm24{k5}, zmm24, [rbx]
|
|
vpsravw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsravw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsravw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsravw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsravw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsravw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsraw xmm7, xmm0, 10
|
|
vpsraw xmm7, [rbx], 10
|
|
vpsraw xmm7, [rbx+r11*8+256], 10
|
|
vpsraw xmm7, [rbx+r11*8-256], 10
|
|
vpsraw ymm13, ymm15, 10
|
|
vpsraw ymm13, [rbx], 10
|
|
vpsraw ymm13, [rbx+r11*8+256], 10
|
|
vpsraw ymm13, [rbx+r11*8-256], 10
|
|
vpsraw zmm24, zmm31, 10
|
|
vpsraw zmm24, [rbx], 10
|
|
vpsraw zmm24, [rbx+r11*8+256], 10
|
|
vpsraw zmm24, [rbx+r11*8-256], 10
|
|
vpsraw xmm2, xmm7, xmm0
|
|
vpsraw xmm2, xmm7, [rbx]
|
|
vpsraw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsraw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsraw xmm2{k5}, xmm7, xmm0
|
|
vpsraw xmm2{k5}, xmm7, [rbx]
|
|
vpsraw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsraw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsraw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsraw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsraw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsraw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsraw ymm16, ymm13, xmm0
|
|
vpsraw ymm16, ymm13, [rbx]
|
|
vpsraw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsraw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsraw ymm16{k5}, ymm13, xmm0
|
|
vpsraw ymm16{k5}, ymm13, [rbx]
|
|
vpsraw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsraw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsraw ymm16{k5}{z}, ymm13, xmm0
|
|
vpsraw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsraw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsraw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsraw zmm24, zmm24, xmm0
|
|
vpsraw zmm24, zmm24, [rbx]
|
|
vpsraw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsraw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsraw zmm24{k5}, zmm24, xmm0
|
|
vpsraw zmm24{k5}, zmm24, [rbx]
|
|
vpsraw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsraw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsraw zmm24{k5}{z}, zmm24, xmm0
|
|
vpsraw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsraw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsraw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsrldq xmm7, xmm0, 10
|
|
vpsrldq xmm7, [rbx], 10
|
|
vpsrldq xmm7, [rbx+r11*8+256], 10
|
|
vpsrldq xmm7, [rbx+r11*8-256], 10
|
|
vpsrldq ymm13, ymm15, 10
|
|
vpsrldq ymm13, [rbx], 10
|
|
vpsrldq ymm13, [rbx+r11*8+256], 10
|
|
vpsrldq ymm13, [rbx+r11*8-256], 10
|
|
vpsrldq zmm24, zmm31, 10
|
|
vpsrldq zmm24, [rbx], 10
|
|
vpsrldq zmm24, [rbx+r11*8+256], 10
|
|
vpsrldq zmm24, [rbx+r11*8-256], 10
|
|
vpsrlvw xmm2, xmm7, xmm0
|
|
vpsrlvw xmm2, xmm7, [rbx]
|
|
vpsrlvw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsrlvw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsrlvw xmm2{k5}, xmm7, xmm0
|
|
vpsrlvw xmm2{k5}, xmm7, [rbx]
|
|
vpsrlvw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsrlvw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsrlvw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsrlvw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsrlvw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsrlvw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsrlvw ymm16, ymm13, ymm15
|
|
vpsrlvw ymm16, ymm13, [rbx]
|
|
vpsrlvw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsrlvw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsrlvw ymm16{k5}, ymm13, ymm15
|
|
vpsrlvw ymm16{k5}, ymm13, [rbx]
|
|
vpsrlvw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsrlvw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsrlvw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsrlvw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsrlvw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsrlvw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsrlvw zmm24, zmm24, zmm31
|
|
vpsrlvw zmm24, zmm24, [rbx]
|
|
vpsrlvw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsrlvw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsrlvw zmm24{k5}, zmm24, zmm31
|
|
vpsrlvw zmm24{k5}, zmm24, [rbx]
|
|
vpsrlvw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsrlvw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsrlvw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsrlvw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsrlvw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsrlvw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsrlw xmm7, xmm0, 10
|
|
vpsrlw xmm7, [rbx], 10
|
|
vpsrlw xmm7, [rbx+r11*8+256], 10
|
|
vpsrlw xmm7, [rbx+r11*8-256], 10
|
|
vpsrlw ymm13, ymm15, 10
|
|
vpsrlw ymm13, [rbx], 10
|
|
vpsrlw ymm13, [rbx+r11*8+256], 10
|
|
vpsrlw ymm13, [rbx+r11*8-256], 10
|
|
vpsrlw zmm24, zmm31, 10
|
|
vpsrlw zmm24, [rbx], 10
|
|
vpsrlw zmm24, [rbx+r11*8+256], 10
|
|
vpsrlw zmm24, [rbx+r11*8-256], 10
|
|
vpsrlw xmm2, xmm7, xmm0
|
|
vpsrlw xmm2, xmm7, [rbx]
|
|
vpsrlw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsrlw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsrlw xmm2{k5}, xmm7, xmm0
|
|
vpsrlw xmm2{k5}, xmm7, [rbx]
|
|
vpsrlw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsrlw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsrlw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsrlw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsrlw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsrlw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsrlw ymm16, ymm13, xmm0
|
|
vpsrlw ymm16, ymm13, [rbx]
|
|
vpsrlw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsrlw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsrlw ymm16{k5}, ymm13, xmm0
|
|
vpsrlw ymm16{k5}, ymm13, [rbx]
|
|
vpsrlw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsrlw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsrlw ymm16{k5}{z}, ymm13, xmm0
|
|
vpsrlw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsrlw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsrlw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsrlw zmm24, zmm24, xmm0
|
|
vpsrlw zmm24, zmm24, [rbx]
|
|
vpsrlw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsrlw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsrlw zmm24{k5}, zmm24, xmm0
|
|
vpsrlw zmm24{k5}, zmm24, [rbx]
|
|
vpsrlw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsrlw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsrlw zmm24{k5}{z}, zmm24, xmm0
|
|
vpsrlw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsrlw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsrlw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubb xmm2, xmm7, xmm0
|
|
vpsubb xmm2, xmm7, [rbx]
|
|
vpsubb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubb xmm2{k5}, xmm7, xmm0
|
|
vpsubb xmm2{k5}, xmm7, [rbx]
|
|
vpsubb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubb xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubb ymm16, ymm13, ymm15
|
|
vpsubb ymm16, ymm13, [rbx]
|
|
vpsubb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubb ymm16{k5}, ymm13, ymm15
|
|
vpsubb ymm16{k5}, ymm13, [rbx]
|
|
vpsubb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubb ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubb zmm24, zmm24, zmm31
|
|
vpsubb zmm24, zmm24, [rbx]
|
|
vpsubb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubb zmm24{k5}, zmm24, zmm31
|
|
vpsubb zmm24{k5}, zmm24, [rbx]
|
|
vpsubb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubb zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubsb xmm2, xmm7, xmm0
|
|
vpsubsb xmm2, xmm7, [rbx]
|
|
vpsubsb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubsb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubsb xmm2{k5}, xmm7, xmm0
|
|
vpsubsb xmm2{k5}, xmm7, [rbx]
|
|
vpsubsb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubsb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubsb xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubsb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubsb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubsb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubsb ymm16, ymm13, ymm15
|
|
vpsubsb ymm16, ymm13, [rbx]
|
|
vpsubsb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubsb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubsb ymm16{k5}, ymm13, ymm15
|
|
vpsubsb ymm16{k5}, ymm13, [rbx]
|
|
vpsubsb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubsb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubsb ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubsb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubsb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubsb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubsb zmm24, zmm24, zmm31
|
|
vpsubsb zmm24, zmm24, [rbx]
|
|
vpsubsb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubsb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubsb zmm24{k5}, zmm24, zmm31
|
|
vpsubsb zmm24{k5}, zmm24, [rbx]
|
|
vpsubsb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubsb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubsb zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubsb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubsb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubsb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubsw xmm2, xmm7, xmm0
|
|
vpsubsw xmm2, xmm7, [rbx]
|
|
vpsubsw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubsw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubsw xmm2{k5}, xmm7, xmm0
|
|
vpsubsw xmm2{k5}, xmm7, [rbx]
|
|
vpsubsw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubsw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubsw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubsw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubsw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubsw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubsw ymm16, ymm13, ymm15
|
|
vpsubsw ymm16, ymm13, [rbx]
|
|
vpsubsw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubsw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubsw ymm16{k5}, ymm13, ymm15
|
|
vpsubsw ymm16{k5}, ymm13, [rbx]
|
|
vpsubsw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubsw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubsw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubsw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubsw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubsw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubsw zmm24, zmm24, zmm31
|
|
vpsubsw zmm24, zmm24, [rbx]
|
|
vpsubsw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubsw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubsw zmm24{k5}, zmm24, zmm31
|
|
vpsubsw zmm24{k5}, zmm24, [rbx]
|
|
vpsubsw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubsw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubsw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubsw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubsw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubsw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubusb xmm2, xmm7, xmm0
|
|
vpsubusb xmm2, xmm7, [rbx]
|
|
vpsubusb xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubusb xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubusb xmm2{k5}, xmm7, xmm0
|
|
vpsubusb xmm2{k5}, xmm7, [rbx]
|
|
vpsubusb xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubusb xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubusb xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubusb xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubusb xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubusb xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubusb ymm16, ymm13, ymm15
|
|
vpsubusb ymm16, ymm13, [rbx]
|
|
vpsubusb ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubusb ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubusb ymm16{k5}, ymm13, ymm15
|
|
vpsubusb ymm16{k5}, ymm13, [rbx]
|
|
vpsubusb ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubusb ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubusb ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubusb ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubusb ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubusb ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubusb zmm24, zmm24, zmm31
|
|
vpsubusb zmm24, zmm24, [rbx]
|
|
vpsubusb zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubusb zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubusb zmm24{k5}, zmm24, zmm31
|
|
vpsubusb zmm24{k5}, zmm24, [rbx]
|
|
vpsubusb zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubusb zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubusb zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubusb zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubusb zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubusb zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubusw xmm2, xmm7, xmm0
|
|
vpsubusw xmm2, xmm7, [rbx]
|
|
vpsubusw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubusw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubusw xmm2{k5}, xmm7, xmm0
|
|
vpsubusw xmm2{k5}, xmm7, [rbx]
|
|
vpsubusw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubusw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubusw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubusw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubusw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubusw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubusw ymm16, ymm13, ymm15
|
|
vpsubusw ymm16, ymm13, [rbx]
|
|
vpsubusw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubusw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubusw ymm16{k5}, ymm13, ymm15
|
|
vpsubusw ymm16{k5}, ymm13, [rbx]
|
|
vpsubusw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubusw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubusw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubusw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubusw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubusw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubusw zmm24, zmm24, zmm31
|
|
vpsubusw zmm24, zmm24, [rbx]
|
|
vpsubusw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubusw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubusw zmm24{k5}, zmm24, zmm31
|
|
vpsubusw zmm24{k5}, zmm24, [rbx]
|
|
vpsubusw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubusw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubusw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubusw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubusw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubusw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpsubw xmm2, xmm7, xmm0
|
|
vpsubw xmm2, xmm7, [rbx]
|
|
vpsubw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpsubw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpsubw xmm2{k5}, xmm7, xmm0
|
|
vpsubw xmm2{k5}, xmm7, [rbx]
|
|
vpsubw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpsubw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpsubw xmm2{k5}{z}, xmm7, xmm0
|
|
vpsubw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpsubw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpsubw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpsubw ymm16, ymm13, ymm15
|
|
vpsubw ymm16, ymm13, [rbx]
|
|
vpsubw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpsubw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpsubw ymm16{k5}, ymm13, ymm15
|
|
vpsubw ymm16{k5}, ymm13, [rbx]
|
|
vpsubw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpsubw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpsubw ymm16{k5}{z}, ymm13, ymm15
|
|
vpsubw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpsubw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpsubw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpsubw zmm24, zmm24, zmm31
|
|
vpsubw zmm24, zmm24, [rbx]
|
|
vpsubw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpsubw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpsubw zmm24{k5}, zmm24, zmm31
|
|
vpsubw zmm24{k5}, zmm24, [rbx]
|
|
vpsubw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpsubw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpsubw zmm24{k5}{z}, zmm24, zmm31
|
|
vpsubw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpsubw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpsubw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vptestmb k3, xmm7, xmm0
|
|
vptestmb k3, xmm7, [rbx]
|
|
vptestmb k3, xmm7, [rbx+r11*8+256]
|
|
vptestmb k3, xmm7, [rbx+r11*8-256]
|
|
vptestmb k3, ymm13, ymm15
|
|
vptestmb k3, ymm13, [rbx]
|
|
vptestmb k3, ymm13, [rbx+r11*8+256]
|
|
vptestmb k3, ymm13, [rbx+r11*8-256]
|
|
vptestmb k3, zmm24, zmm31
|
|
vptestmb k3, zmm24, [rbx]
|
|
vptestmb k3, zmm24, [rbx+r11*8+256]
|
|
vptestmb k3, zmm24, [rbx+r11*8-256]
|
|
vptestmb k3{k5}, xmm7, xmm0
|
|
vptestmb k3{k5}, xmm7, [rbx]
|
|
vptestmb k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vptestmb k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vptestmb k3{k5}, ymm13, ymm15
|
|
vptestmb k3{k5}, ymm13, [rbx]
|
|
vptestmb k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vptestmb k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vptestmb k3{k5}, zmm24, zmm31
|
|
vptestmb k3{k5}, zmm24, [rbx]
|
|
vptestmb k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vptestmb k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vptestmw k3, xmm7, xmm0
|
|
vptestmw k3, xmm7, [rbx]
|
|
vptestmw k3, xmm7, [rbx+r11*8+256]
|
|
vptestmw k3, xmm7, [rbx+r11*8-256]
|
|
vptestmw k3, ymm13, ymm15
|
|
vptestmw k3, ymm13, [rbx]
|
|
vptestmw k3, ymm13, [rbx+r11*8+256]
|
|
vptestmw k3, ymm13, [rbx+r11*8-256]
|
|
vptestmw k3, zmm24, zmm31
|
|
vptestmw k3, zmm24, [rbx]
|
|
vptestmw k3, zmm24, [rbx+r11*8+256]
|
|
vptestmw k3, zmm24, [rbx+r11*8-256]
|
|
vptestmw k3{k5}, xmm7, xmm0
|
|
vptestmw k3{k5}, xmm7, [rbx]
|
|
vptestmw k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vptestmw k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vptestmw k3{k5}, ymm13, ymm15
|
|
vptestmw k3{k5}, ymm13, [rbx]
|
|
vptestmw k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vptestmw k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vptestmw k3{k5}, zmm24, zmm31
|
|
vptestmw k3{k5}, zmm24, [rbx]
|
|
vptestmw k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vptestmw k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vptestnmb k3, xmm7, xmm0
|
|
vptestnmb k3, xmm7, [rbx]
|
|
vptestnmb k3, xmm7, [rbx+r11*8+256]
|
|
vptestnmb k3, xmm7, [rbx+r11*8-256]
|
|
vptestnmb k3, ymm13, ymm15
|
|
vptestnmb k3, ymm13, [rbx]
|
|
vptestnmb k3, ymm13, [rbx+r11*8+256]
|
|
vptestnmb k3, ymm13, [rbx+r11*8-256]
|
|
vptestnmb k3, zmm24, zmm31
|
|
vptestnmb k3, zmm24, [rbx]
|
|
vptestnmb k3, zmm24, [rbx+r11*8+256]
|
|
vptestnmb k3, zmm24, [rbx+r11*8-256]
|
|
vptestnmb k3{k5}, xmm7, xmm0
|
|
vptestnmb k3{k5}, xmm7, [rbx]
|
|
vptestnmb k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vptestnmb k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vptestnmb k3{k5}, ymm13, ymm15
|
|
vptestnmb k3{k5}, ymm13, [rbx]
|
|
vptestnmb k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vptestnmb k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vptestnmb k3{k5}, zmm24, zmm31
|
|
vptestnmb k3{k5}, zmm24, [rbx]
|
|
vptestnmb k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vptestnmb k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vptestnmw k3, xmm7, xmm0
|
|
vptestnmw k3, xmm7, [rbx]
|
|
vptestnmw k3, xmm7, [rbx+r11*8+256]
|
|
vptestnmw k3, xmm7, [rbx+r11*8-256]
|
|
vptestnmw k3, ymm13, ymm15
|
|
vptestnmw k3, ymm13, [rbx]
|
|
vptestnmw k3, ymm13, [rbx+r11*8+256]
|
|
vptestnmw k3, ymm13, [rbx+r11*8-256]
|
|
vptestnmw k3, zmm24, zmm31
|
|
vptestnmw k3, zmm24, [rbx]
|
|
vptestnmw k3, zmm24, [rbx+r11*8+256]
|
|
vptestnmw k3, zmm24, [rbx+r11*8-256]
|
|
vptestnmw k3{k5}, xmm7, xmm0
|
|
vptestnmw k3{k5}, xmm7, [rbx]
|
|
vptestnmw k3{k5}, xmm7, [rbx+r11*8+256]
|
|
vptestnmw k3{k5}, xmm7, [rbx+r11*8-256]
|
|
vptestnmw k3{k5}, ymm13, ymm15
|
|
vptestnmw k3{k5}, ymm13, [rbx]
|
|
vptestnmw k3{k5}, ymm13, [rbx+r11*8+256]
|
|
vptestnmw k3{k5}, ymm13, [rbx+r11*8-256]
|
|
vptestnmw k3{k5}, zmm24, zmm31
|
|
vptestnmw k3{k5}, zmm24, [rbx]
|
|
vptestnmw k3{k5}, zmm24, [rbx+r11*8+256]
|
|
vptestnmw k3{k5}, zmm24, [rbx+r11*8-256]
|
|
vpunpckhbw xmm2, xmm7, xmm0
|
|
vpunpckhbw xmm2, xmm7, [rbx]
|
|
vpunpckhbw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpunpckhbw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpunpckhbw xmm2{k5}, xmm7, xmm0
|
|
vpunpckhbw xmm2{k5}, xmm7, [rbx]
|
|
vpunpckhbw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpunpckhbw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpunpckhbw xmm2{k5}{z}, xmm7, xmm0
|
|
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpunpckhbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpunpckhbw ymm16, ymm13, ymm15
|
|
vpunpckhbw ymm16, ymm13, [rbx]
|
|
vpunpckhbw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpunpckhbw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpunpckhbw ymm16{k5}, ymm13, ymm15
|
|
vpunpckhbw ymm16{k5}, ymm13, [rbx]
|
|
vpunpckhbw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpunpckhbw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpunpckhbw ymm16{k5}{z}, ymm13, ymm15
|
|
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpunpckhbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpunpckhbw zmm24, zmm24, zmm31
|
|
vpunpckhbw zmm24, zmm24, [rbx]
|
|
vpunpckhbw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpunpckhbw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpunpckhbw zmm24{k5}, zmm24, zmm31
|
|
vpunpckhbw zmm24{k5}, zmm24, [rbx]
|
|
vpunpckhbw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpunpckhbw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpunpckhbw zmm24{k5}{z}, zmm24, zmm31
|
|
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpunpckhbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpunpckhwd xmm2, xmm7, xmm0
|
|
vpunpckhwd xmm2, xmm7, [rbx]
|
|
vpunpckhwd xmm2, xmm7, [rbx+r11*8+256]
|
|
vpunpckhwd xmm2, xmm7, [rbx+r11*8-256]
|
|
vpunpckhwd xmm2{k5}, xmm7, xmm0
|
|
vpunpckhwd xmm2{k5}, xmm7, [rbx]
|
|
vpunpckhwd xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpunpckhwd xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpunpckhwd xmm2{k5}{z}, xmm7, xmm0
|
|
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx]
|
|
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpunpckhwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpunpckhwd ymm16, ymm13, ymm15
|
|
vpunpckhwd ymm16, ymm13, [rbx]
|
|
vpunpckhwd ymm16, ymm13, [rbx+r11*8+256]
|
|
vpunpckhwd ymm16, ymm13, [rbx+r11*8-256]
|
|
vpunpckhwd ymm16{k5}, ymm13, ymm15
|
|
vpunpckhwd ymm16{k5}, ymm13, [rbx]
|
|
vpunpckhwd ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpunpckhwd ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpunpckhwd ymm16{k5}{z}, ymm13, ymm15
|
|
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx]
|
|
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpunpckhwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpunpckhwd zmm24, zmm24, zmm31
|
|
vpunpckhwd zmm24, zmm24, [rbx]
|
|
vpunpckhwd zmm24, zmm24, [rbx+r11*8+256]
|
|
vpunpckhwd zmm24, zmm24, [rbx+r11*8-256]
|
|
vpunpckhwd zmm24{k5}, zmm24, zmm31
|
|
vpunpckhwd zmm24{k5}, zmm24, [rbx]
|
|
vpunpckhwd zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpunpckhwd zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpunpckhwd zmm24{k5}{z}, zmm24, zmm31
|
|
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx]
|
|
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpunpckhwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpunpcklbw xmm2, xmm7, xmm0
|
|
vpunpcklbw xmm2, xmm7, [rbx]
|
|
vpunpcklbw xmm2, xmm7, [rbx+r11*8+256]
|
|
vpunpcklbw xmm2, xmm7, [rbx+r11*8-256]
|
|
vpunpcklbw xmm2{k5}, xmm7, xmm0
|
|
vpunpcklbw xmm2{k5}, xmm7, [rbx]
|
|
vpunpcklbw xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpunpcklbw xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpunpcklbw xmm2{k5}{z}, xmm7, xmm0
|
|
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx]
|
|
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpunpcklbw xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpunpcklbw ymm16, ymm13, ymm15
|
|
vpunpcklbw ymm16, ymm13, [rbx]
|
|
vpunpcklbw ymm16, ymm13, [rbx+r11*8+256]
|
|
vpunpcklbw ymm16, ymm13, [rbx+r11*8-256]
|
|
vpunpcklbw ymm16{k5}, ymm13, ymm15
|
|
vpunpcklbw ymm16{k5}, ymm13, [rbx]
|
|
vpunpcklbw ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpunpcklbw ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpunpcklbw ymm16{k5}{z}, ymm13, ymm15
|
|
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx]
|
|
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpunpcklbw ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpunpcklbw zmm24, zmm24, zmm31
|
|
vpunpcklbw zmm24, zmm24, [rbx]
|
|
vpunpcklbw zmm24, zmm24, [rbx+r11*8+256]
|
|
vpunpcklbw zmm24, zmm24, [rbx+r11*8-256]
|
|
vpunpcklbw zmm24{k5}, zmm24, zmm31
|
|
vpunpcklbw zmm24{k5}, zmm24, [rbx]
|
|
vpunpcklbw zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpunpcklbw zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpunpcklbw zmm24{k5}{z}, zmm24, zmm31
|
|
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx]
|
|
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpunpcklbw zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|
|
vpunpcklwd xmm2, xmm7, xmm0
|
|
vpunpcklwd xmm2, xmm7, [rbx]
|
|
vpunpcklwd xmm2, xmm7, [rbx+r11*8+256]
|
|
vpunpcklwd xmm2, xmm7, [rbx+r11*8-256]
|
|
vpunpcklwd xmm2{k5}, xmm7, xmm0
|
|
vpunpcklwd xmm2{k5}, xmm7, [rbx]
|
|
vpunpcklwd xmm2{k5}, xmm7, [rbx+r11*8+256]
|
|
vpunpcklwd xmm2{k5}, xmm7, [rbx+r11*8-256]
|
|
vpunpcklwd xmm2{k5}{z}, xmm7, xmm0
|
|
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx]
|
|
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx+r11*8+256]
|
|
vpunpcklwd xmm2{k5}{z}, xmm7, [rbx+r11*8-256]
|
|
vpunpcklwd ymm16, ymm13, ymm15
|
|
vpunpcklwd ymm16, ymm13, [rbx]
|
|
vpunpcklwd ymm16, ymm13, [rbx+r11*8+256]
|
|
vpunpcklwd ymm16, ymm13, [rbx+r11*8-256]
|
|
vpunpcklwd ymm16{k5}, ymm13, ymm15
|
|
vpunpcklwd ymm16{k5}, ymm13, [rbx]
|
|
vpunpcklwd ymm16{k5}, ymm13, [rbx+r11*8+256]
|
|
vpunpcklwd ymm16{k5}, ymm13, [rbx+r11*8-256]
|
|
vpunpcklwd ymm16{k5}{z}, ymm13, ymm15
|
|
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx]
|
|
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx+r11*8+256]
|
|
vpunpcklwd ymm16{k5}{z}, ymm13, [rbx+r11*8-256]
|
|
vpunpcklwd zmm24, zmm24, zmm31
|
|
vpunpcklwd zmm24, zmm24, [rbx]
|
|
vpunpcklwd zmm24, zmm24, [rbx+r11*8+256]
|
|
vpunpcklwd zmm24, zmm24, [rbx+r11*8-256]
|
|
vpunpcklwd zmm24{k5}, zmm24, zmm31
|
|
vpunpcklwd zmm24{k5}, zmm24, [rbx]
|
|
vpunpcklwd zmm24{k5}, zmm24, [rbx+r11*8+256]
|
|
vpunpcklwd zmm24{k5}, zmm24, [rbx+r11*8-256]
|
|
vpunpcklwd zmm24{k5}{z}, zmm24, zmm31
|
|
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx]
|
|
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx+r11*8+256]
|
|
vpunpcklwd zmm24{k5}{z}, zmm24, [rbx+r11*8-256]
|