bits 64 kandnw k3, k7, k1 kandw k3, k7, k1 kmovw k3, [rbx] kmovw k3, [rbx+rsi*8+256] kmovw k3, [rbx+rsi*8-256] kmovw k3, k1 kmovw k3, [rbx] kmovw [rbx], k3 kmovw [rbx+rsi*8+256], k3 kmovw [rbx+rsi*8-256], k3 kmovw k3, ecx kmovw ecx, k1 knotw k3, k1 kortestw k3, k1 korw k3, k7, k1 kshiftlw k3, k1, 10 kshiftrw k3, k1, 10 kunpckbw k3, k7, k1 kxnorw k3, k7, k1 kxorw k3, k7, k1 vaddpd xmm2, xmm7, xmm0 vaddpd xmm2, xmm7, [rbx] vaddpd xmm2, xmm7, [rbx]{1to2} vaddpd xmm2, xmm7, [rbx+r11*8+256] vaddpd xmm2, xmm7, [rbx+r11*8-256] vaddpd xmm2{k5}, xmm7, xmm0 vaddpd xmm2{k5}, xmm7, [rbx] vaddpd xmm2{k5}, xmm7, [rbx]{1to2} vaddpd xmm2{k5}, xmm7, [rbx+r11*8+256] vaddpd xmm2{k5}, xmm7, [rbx+r11*8-256] vaddpd xmm2{k5}{z}, xmm7, xmm0 vaddpd xmm2{k5}{z}, xmm7, [rbx] vaddpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vaddpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vaddpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vaddpd ymm16, ymm13, ymm15 vaddpd ymm16, ymm13, [rbx] vaddpd ymm16, ymm13, [rbx]{1to4} vaddpd ymm16, ymm13, [rbx+r11*8+256] vaddpd ymm16, ymm13, [rbx+r11*8-256] vaddpd ymm16{k5}, ymm13, ymm15 vaddpd ymm16{k5}, ymm13, [rbx] vaddpd ymm16{k5}, ymm13, [rbx]{1to4} vaddpd ymm16{k5}, ymm13, [rbx+r11*8+256] vaddpd ymm16{k5}, ymm13, [rbx+r11*8-256] vaddpd ymm16{k5}{z}, ymm13, ymm15 vaddpd ymm16{k5}{z}, ymm13, [rbx] vaddpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vaddpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vaddpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vaddpd zmm24, zmm24, zmm31 vaddpd zmm24, zmm24, zmm31, {rd-sae} vaddpd zmm24, zmm24, [rbx] vaddpd zmm24, zmm24, [rbx]{1to8} vaddpd zmm24, zmm24, [rbx+r11*8+256] vaddpd zmm24, zmm24, [rbx+r11*8-256] vaddpd zmm24{k5}, zmm24, zmm31 vaddpd zmm24{k5}, zmm24, zmm31, {rd-sae} vaddpd zmm24{k5}, zmm24, [rbx] vaddpd zmm24{k5}, zmm24, [rbx]{1to8} vaddpd zmm24{k5}, zmm24, [rbx+r11*8+256] vaddpd zmm24{k5}, zmm24, [rbx+r11*8-256] vaddpd zmm24{k5}{z}, zmm24, zmm31 vaddpd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vaddpd zmm24{k5}{z}, zmm24, [rbx] vaddpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vaddpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vaddpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vaddps xmm2, xmm7, xmm0 vaddps xmm2, xmm7, [rbx] vaddps xmm2, xmm7, [rbx]{1to4} vaddps xmm2, xmm7, [rbx+r11*8+256] vaddps xmm2, xmm7, [rbx+r11*8-256] vaddps xmm2{k5}, xmm7, xmm0 vaddps xmm2{k5}, xmm7, [rbx] vaddps xmm2{k5}, xmm7, [rbx]{1to4} vaddps xmm2{k5}, xmm7, [rbx+r11*8+256] vaddps xmm2{k5}, xmm7, [rbx+r11*8-256] vaddps xmm2{k5}{z}, xmm7, xmm0 vaddps xmm2{k5}{z}, xmm7, [rbx] vaddps xmm2{k5}{z}, xmm7, [rbx]{1to4} vaddps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vaddps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vaddps ymm16, ymm13, ymm15 vaddps ymm16, ymm13, [rbx] vaddps ymm16, ymm13, [rbx]{1to8} vaddps ymm16, ymm13, [rbx+r11*8+256] vaddps ymm16, ymm13, [rbx+r11*8-256] vaddps ymm16{k5}, ymm13, ymm15 vaddps ymm16{k5}, ymm13, [rbx] vaddps ymm16{k5}, ymm13, [rbx]{1to8} vaddps ymm16{k5}, ymm13, [rbx+r11*8+256] vaddps ymm16{k5}, ymm13, [rbx+r11*8-256] vaddps ymm16{k5}{z}, ymm13, ymm15 vaddps ymm16{k5}{z}, ymm13, [rbx] vaddps ymm16{k5}{z}, ymm13, [rbx]{1to8} vaddps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vaddps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vaddps zmm24, zmm24, zmm31 vaddps zmm24, zmm24, zmm31, {rd-sae} vaddps zmm24, zmm24, [rbx] vaddps zmm24, zmm24, [rbx]{1to16} vaddps zmm24, zmm24, [rbx+r11*8+256] vaddps zmm24, zmm24, [rbx+r11*8-256] vaddps zmm24{k5}, zmm24, zmm31 vaddps zmm24{k5}, zmm24, zmm31, {rd-sae} vaddps zmm24{k5}, zmm24, [rbx] vaddps zmm24{k5}, zmm24, [rbx]{1to16} vaddps zmm24{k5}, zmm24, [rbx+r11*8+256] vaddps zmm24{k5}, zmm24, [rbx+r11*8-256] vaddps zmm24{k5}{z}, zmm24, zmm31 vaddps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vaddps zmm24{k5}{z}, zmm24, [rbx] vaddps zmm24{k5}{z}, zmm24, [rbx]{1to16} vaddps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vaddps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vaddsd xmm2, xmm7, xmm0 vaddsd xmm2, xmm7, xmm0, {rd-sae} vaddsd xmm2, xmm7, [rbx] vaddsd xmm2, xmm7, [rbx+r11*8+256] vaddsd xmm2, xmm7, [rbx+r11*8-256] vaddsd xmm2{k5}, xmm7, xmm0 vaddsd xmm2{k5}, xmm7, xmm0, {rd-sae} vaddsd xmm2{k5}, xmm7, [rbx] vaddsd xmm2{k5}, xmm7, [rbx+r11*8+256] vaddsd xmm2{k5}, xmm7, [rbx+r11*8-256] vaddsd xmm2{k5}{z}, xmm7, xmm0 vaddsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vaddsd xmm2{k5}{z}, xmm7, [rbx] vaddsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vaddsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vaddss xmm2, xmm7, xmm0 vaddss xmm2, xmm7, xmm0, {rd-sae} vaddss xmm2, xmm7, [rbx] vaddss xmm2, xmm7, [rbx+r11*8+256] vaddss xmm2, xmm7, [rbx+r11*8-256] vaddss xmm2{k5}, xmm7, xmm0 vaddss xmm2{k5}, xmm7, xmm0, {rd-sae} vaddss xmm2{k5}, xmm7, [rbx] vaddss xmm2{k5}, xmm7, [rbx+r11*8+256] vaddss xmm2{k5}, xmm7, [rbx+r11*8-256] vaddss xmm2{k5}{z}, xmm7, xmm0 vaddss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vaddss xmm2{k5}{z}, xmm7, [rbx] vaddss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vaddss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] valignd xmm2, xmm7, xmm0, 10 valignd xmm2, xmm7, [rbx], 10 valignd xmm2, xmm7, [rbx]{1to4}, 10 valignd xmm2, xmm7, [rbx+r11*8+256], 10 valignd xmm2, xmm7, [rbx+r11*8-256], 10 valignd xmm2{k5}, xmm7, xmm0, 10 valignd xmm2{k5}, xmm7, [rbx], 10 valignd xmm2{k5}, xmm7, [rbx]{1to4}, 10 valignd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 valignd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 valignd xmm2{k5}{z}, xmm7, xmm0, 10 valignd xmm2{k5}{z}, xmm7, [rbx], 10 valignd xmm2{k5}{z}, xmm7, [rbx]{1to4}, 10 valignd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 valignd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 valignd ymm16, ymm13, ymm15, 10 valignd ymm16, ymm13, [rbx], 10 valignd ymm16, ymm13, [rbx]{1to8}, 10 valignd ymm16, ymm13, [rbx+r11*8+256], 10 valignd ymm16, ymm13, [rbx+r11*8-256], 10 valignd ymm16{k5}, ymm13, ymm15, 10 valignd ymm16{k5}, ymm13, [rbx], 10 valignd ymm16{k5}, ymm13, [rbx]{1to8}, 10 valignd ymm16{k5}, ymm13, [rbx+r11*8+256], 10 valignd ymm16{k5}, ymm13, [rbx+r11*8-256], 10 valignd ymm16{k5}{z}, ymm13, ymm15, 10 valignd ymm16{k5}{z}, ymm13, [rbx], 10 valignd ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 valignd ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 valignd ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 valignd zmm24, zmm24, zmm31, 10 valignd zmm24, zmm24, [rbx], 10 valignd zmm24, zmm24, [rbx]{1to16}, 10 valignd zmm24, zmm24, [rbx+r11*8+256], 10 valignd zmm24, zmm24, [rbx+r11*8-256], 10 valignd zmm24{k5}, zmm24, zmm31, 10 valignd zmm24{k5}, zmm24, [rbx], 10 valignd zmm24{k5}, zmm24, [rbx]{1to16}, 10 valignd zmm24{k5}, zmm24, [rbx+r11*8+256], 10 valignd zmm24{k5}, zmm24, [rbx+r11*8-256], 10 valignd zmm24{k5}{z}, zmm24, zmm31, 10 valignd zmm24{k5}{z}, zmm24, [rbx], 10 valignd zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 valignd zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 valignd zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 valignq xmm2, xmm7, xmm0, 10 valignq xmm2, xmm7, [rbx], 10 valignq xmm2, xmm7, [rbx]{1to2}, 10 valignq xmm2, xmm7, [rbx+r11*8+256], 10 valignq xmm2, xmm7, [rbx+r11*8-256], 10 valignq xmm2{k5}, xmm7, xmm0, 10 valignq xmm2{k5}, xmm7, [rbx], 10 valignq xmm2{k5}, xmm7, [rbx]{1to2}, 10 valignq xmm2{k5}, xmm7, [rbx+r11*8+256], 10 valignq xmm2{k5}, xmm7, [rbx+r11*8-256], 10 valignq xmm2{k5}{z}, xmm7, xmm0, 10 valignq xmm2{k5}{z}, xmm7, [rbx], 10 valignq xmm2{k5}{z}, xmm7, [rbx]{1to2}, 10 valignq xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 valignq xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 valignq ymm16, ymm13, ymm15, 10 valignq ymm16, ymm13, [rbx], 10 valignq ymm16, ymm13, [rbx]{1to4}, 10 valignq ymm16, ymm13, [rbx+r11*8+256], 10 valignq ymm16, ymm13, [rbx+r11*8-256], 10 valignq ymm16{k5}, ymm13, ymm15, 10 valignq ymm16{k5}, ymm13, [rbx], 10 valignq ymm16{k5}, ymm13, [rbx]{1to4}, 10 valignq ymm16{k5}, ymm13, [rbx+r11*8+256], 10 valignq ymm16{k5}, ymm13, [rbx+r11*8-256], 10 valignq ymm16{k5}{z}, ymm13, ymm15, 10 valignq ymm16{k5}{z}, ymm13, [rbx], 10 valignq ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 valignq ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 valignq ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 valignq zmm24, zmm24, zmm31, 10 valignq zmm24, zmm24, [rbx], 10 valignq zmm24, zmm24, [rbx]{1to8}, 10 valignq zmm24, zmm24, [rbx+r11*8+256], 10 valignq zmm24, zmm24, [rbx+r11*8-256], 10 valignq zmm24{k5}, zmm24, zmm31, 10 valignq zmm24{k5}, zmm24, [rbx], 10 valignq zmm24{k5}, zmm24, [rbx]{1to8}, 10 valignq zmm24{k5}, zmm24, [rbx+r11*8+256], 10 valignq zmm24{k5}, zmm24, [rbx+r11*8-256], 10 valignq zmm24{k5}{z}, zmm24, zmm31, 10 valignq zmm24{k5}{z}, zmm24, [rbx], 10 valignq zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 valignq zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 valignq zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vblendmpd xmm2, xmm7, xmm0 vblendmpd xmm2, xmm7, [rbx] vblendmpd xmm2, xmm7, [rbx]{1to2} vblendmpd xmm2, xmm7, [rbx+r11*8+256] vblendmpd xmm2, xmm7, [rbx+r11*8-256] vblendmpd xmm2{k5}, xmm7, xmm0 vblendmpd xmm2{k5}, xmm7, [rbx] vblendmpd xmm2{k5}, xmm7, [rbx]{1to2} vblendmpd xmm2{k5}, xmm7, [rbx+r11*8+256] vblendmpd xmm2{k5}, xmm7, [rbx+r11*8-256] vblendmpd xmm2{k5}{z}, xmm7, xmm0 vblendmpd xmm2{k5}{z}, xmm7, [rbx] vblendmpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vblendmpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vblendmpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vblendmpd ymm16, ymm13, ymm15 vblendmpd ymm16, ymm13, [rbx] vblendmpd ymm16, ymm13, [rbx]{1to4} vblendmpd ymm16, ymm13, [rbx+r11*8+256] vblendmpd ymm16, ymm13, [rbx+r11*8-256] vblendmpd ymm16{k5}, ymm13, ymm15 vblendmpd ymm16{k5}, ymm13, [rbx] vblendmpd ymm16{k5}, ymm13, [rbx]{1to4} vblendmpd ymm16{k5}, ymm13, [rbx+r11*8+256] vblendmpd ymm16{k5}, ymm13, [rbx+r11*8-256] vblendmpd ymm16{k5}{z}, ymm13, ymm15 vblendmpd ymm16{k5}{z}, ymm13, [rbx] vblendmpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vblendmpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vblendmpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vblendmpd zmm24, zmm24, zmm31 vblendmpd zmm24, zmm24, [rbx] vblendmpd zmm24, zmm24, [rbx]{1to8} vblendmpd zmm24, zmm24, [rbx+r11*8+256] vblendmpd zmm24, zmm24, [rbx+r11*8-256] vblendmpd zmm24{k5}, zmm24, zmm31 vblendmpd zmm24{k5}, zmm24, [rbx] vblendmpd zmm24{k5}, zmm24, [rbx]{1to8} vblendmpd zmm24{k5}, zmm24, [rbx+r11*8+256] vblendmpd zmm24{k5}, zmm24, [rbx+r11*8-256] vblendmpd zmm24{k5}{z}, zmm24, zmm31 vblendmpd zmm24{k5}{z}, zmm24, [rbx] vblendmpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vblendmpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vblendmpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vblendmps xmm2, xmm7, xmm0 vblendmps xmm2, xmm7, [rbx] vblendmps xmm2, xmm7, [rbx]{1to4} vblendmps xmm2, xmm7, [rbx+r11*8+256] vblendmps xmm2, xmm7, [rbx+r11*8-256] vblendmps xmm2{k5}, xmm7, xmm0 vblendmps xmm2{k5}, xmm7, [rbx] vblendmps xmm2{k5}, xmm7, [rbx]{1to4} vblendmps xmm2{k5}, xmm7, [rbx+r11*8+256] vblendmps xmm2{k5}, xmm7, [rbx+r11*8-256] vblendmps xmm2{k5}{z}, xmm7, xmm0 vblendmps xmm2{k5}{z}, xmm7, [rbx] vblendmps xmm2{k5}{z}, xmm7, [rbx]{1to4} vblendmps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vblendmps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vblendmps ymm16, ymm13, ymm15 vblendmps ymm16, ymm13, [rbx] vblendmps ymm16, ymm13, [rbx]{1to8} vblendmps ymm16, ymm13, [rbx+r11*8+256] vblendmps ymm16, ymm13, [rbx+r11*8-256] vblendmps ymm16{k5}, ymm13, ymm15 vblendmps ymm16{k5}, ymm13, [rbx] vblendmps ymm16{k5}, ymm13, [rbx]{1to8} vblendmps ymm16{k5}, ymm13, [rbx+r11*8+256] vblendmps ymm16{k5}, ymm13, [rbx+r11*8-256] vblendmps ymm16{k5}{z}, ymm13, ymm15 vblendmps ymm16{k5}{z}, ymm13, [rbx] vblendmps ymm16{k5}{z}, ymm13, [rbx]{1to8} vblendmps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vblendmps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vblendmps zmm24, zmm24, zmm31 vblendmps zmm24, zmm24, [rbx] vblendmps zmm24, zmm24, [rbx]{1to16} vblendmps zmm24, zmm24, [rbx+r11*8+256] vblendmps zmm24, zmm24, [rbx+r11*8-256] vblendmps zmm24{k5}, zmm24, zmm31 vblendmps zmm24{k5}, zmm24, [rbx] vblendmps zmm24{k5}, zmm24, [rbx]{1to16} vblendmps zmm24{k5}, zmm24, [rbx+r11*8+256] vblendmps zmm24{k5}, zmm24, [rbx+r11*8-256] vblendmps zmm24{k5}{z}, zmm24, zmm31 vblendmps zmm24{k5}{z}, zmm24, [rbx] vblendmps zmm24{k5}{z}, zmm24, [rbx]{1to16} vblendmps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vblendmps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vbroadcastf32x4 ymm16, [rbx] vbroadcastf32x4 ymm16, [rbx+rsi*8+256] vbroadcastf32x4 ymm16, [rbx+rsi*8-256] vbroadcastf32x4 ymm16{k5}, [rbx] vbroadcastf32x4 ymm16{k5}, [rbx+rsi*8+256] vbroadcastf32x4 ymm16{k5}, [rbx+rsi*8-256] vbroadcastf32x4 ymm16{k5}{z}, [rbx] vbroadcastf32x4 ymm16{k5}{z}, [rbx+rsi*8+256] vbroadcastf32x4 ymm16{k5}{z}, [rbx+rsi*8-256] vbroadcastf32x4 zmm24, [rbx] vbroadcastf32x4 zmm24, [rbx+rsi*8+256] vbroadcastf32x4 zmm24, [rbx+rsi*8-256] vbroadcastf32x4 zmm24{k5}, [rbx] vbroadcastf32x4 zmm24{k5}, [rbx+rsi*8+256] vbroadcastf32x4 zmm24{k5}, [rbx+rsi*8-256] vbroadcastf32x4 zmm24{k5}{z}, [rbx] vbroadcastf32x4 zmm24{k5}{z}, [rbx+rsi*8+256] vbroadcastf32x4 zmm24{k5}{z}, [rbx+rsi*8-256] vbroadcastf64x4 zmm24, [rbx] vbroadcastf64x4 zmm24, [rbx+rsi*8+256] vbroadcastf64x4 zmm24, [rbx+rsi*8-256] vbroadcastf64x4 zmm24{k5}, [rbx] vbroadcastf64x4 zmm24{k5}, [rbx+rsi*8+256] vbroadcastf64x4 zmm24{k5}, [rbx+rsi*8-256] vbroadcastf64x4 zmm24{k5}{z}, [rbx] vbroadcastf64x4 zmm24{k5}{z}, [rbx+rsi*8+256] vbroadcastf64x4 zmm24{k5}{z}, [rbx+rsi*8-256] vbroadcasti32x4 ymm16, [rbx] vbroadcasti32x4 ymm16, [rbx+rsi*8+256] vbroadcasti32x4 ymm16, [rbx+rsi*8-256] vbroadcasti32x4 ymm16{k5}, [rbx] vbroadcasti32x4 ymm16{k5}, [rbx+rsi*8+256] vbroadcasti32x4 ymm16{k5}, [rbx+rsi*8-256] vbroadcasti32x4 ymm16{k5}{z}, [rbx] vbroadcasti32x4 ymm16{k5}{z}, [rbx+rsi*8+256] vbroadcasti32x4 ymm16{k5}{z}, [rbx+rsi*8-256] vbroadcasti32x4 zmm24, [rbx] vbroadcasti32x4 zmm24, [rbx+rsi*8+256] vbroadcasti32x4 zmm24, [rbx+rsi*8-256] vbroadcasti32x4 zmm24{k5}, [rbx] vbroadcasti32x4 zmm24{k5}, [rbx+rsi*8+256] vbroadcasti32x4 zmm24{k5}, [rbx+rsi*8-256] vbroadcasti32x4 zmm24{k5}{z}, [rbx] vbroadcasti32x4 zmm24{k5}{z}, [rbx+rsi*8+256] vbroadcasti32x4 zmm24{k5}{z}, [rbx+rsi*8-256] vbroadcasti64x4 zmm24, [rbx] vbroadcasti64x4 zmm24, [rbx+rsi*8+256] vbroadcasti64x4 zmm24, [rbx+rsi*8-256] vbroadcasti64x4 zmm24{k5}, [rbx] vbroadcasti64x4 zmm24{k5}, [rbx+rsi*8+256] vbroadcasti64x4 zmm24{k5}, [rbx+rsi*8-256] vbroadcasti64x4 zmm24{k5}{z}, [rbx] vbroadcasti64x4 zmm24{k5}{z}, [rbx+rsi*8+256] vbroadcasti64x4 zmm24{k5}{z}, [rbx+rsi*8-256] vbroadcastsd ymm16, xmm0 vbroadcastsd ymm16, [rbx] vbroadcastsd ymm16, [rbx+r11*8+256] vbroadcastsd ymm16, [rbx+r11*8-256] vbroadcastsd ymm16{k5}, xmm0 vbroadcastsd ymm16{k5}, [rbx] vbroadcastsd ymm16{k5}, [rbx+r11*8+256] vbroadcastsd ymm16{k5}, [rbx+r11*8-256] vbroadcastsd ymm16{k5}{z}, xmm0 vbroadcastsd ymm16{k5}{z}, [rbx] vbroadcastsd ymm16{k5}{z}, [rbx+r11*8+256] vbroadcastsd ymm16{k5}{z}, [rbx+r11*8-256] vbroadcastsd zmm24, xmm0 vbroadcastsd zmm24, [rbx] vbroadcastsd zmm24, [rbx+r11*8+256] vbroadcastsd zmm24, [rbx+r11*8-256] vbroadcastsd zmm24{k5}, xmm0 vbroadcastsd zmm24{k5}, [rbx] vbroadcastsd zmm24{k5}, [rbx+r11*8+256] vbroadcastsd zmm24{k5}, [rbx+r11*8-256] vbroadcastsd zmm24{k5}{z}, xmm0 vbroadcastsd zmm24{k5}{z}, [rbx] vbroadcastsd zmm24{k5}{z}, [rbx+r11*8+256] vbroadcastsd zmm24{k5}{z}, [rbx+r11*8-256] vbroadcastss xmm2, xmm0 vbroadcastss xmm2, [rbx] vbroadcastss xmm2, [rbx+r11*8+256] vbroadcastss xmm2, [rbx+r11*8-256] vbroadcastss xmm2{k5}, xmm0 vbroadcastss xmm2{k5}, [rbx] vbroadcastss xmm2{k5}, [rbx+r11*8+256] vbroadcastss xmm2{k5}, [rbx+r11*8-256] vbroadcastss xmm2{k5}{z}, xmm0 vbroadcastss xmm2{k5}{z}, [rbx] vbroadcastss xmm2{k5}{z}, [rbx+r11*8+256] vbroadcastss xmm2{k5}{z}, [rbx+r11*8-256] vbroadcastss ymm16, xmm0 vbroadcastss ymm16, [rbx] vbroadcastss ymm16, [rbx+r11*8+256] vbroadcastss ymm16, [rbx+r11*8-256] vbroadcastss ymm16{k5}, xmm0 vbroadcastss ymm16{k5}, [rbx] vbroadcastss ymm16{k5}, [rbx+r11*8+256] vbroadcastss ymm16{k5}, [rbx+r11*8-256] vbroadcastss ymm16{k5}{z}, xmm0 vbroadcastss ymm16{k5}{z}, [rbx] vbroadcastss ymm16{k5}{z}, [rbx+r11*8+256] vbroadcastss ymm16{k5}{z}, [rbx+r11*8-256] vbroadcastss zmm24, xmm0 vbroadcastss zmm24, [rbx] vbroadcastss zmm24, [rbx+r11*8+256] vbroadcastss zmm24, [rbx+r11*8-256] vbroadcastss zmm24{k5}, xmm0 vbroadcastss zmm24{k5}, [rbx] vbroadcastss zmm24{k5}, [rbx+r11*8+256] vbroadcastss zmm24{k5}, [rbx+r11*8-256] vbroadcastss zmm24{k5}{z}, xmm0 vbroadcastss zmm24{k5}{z}, [rbx] vbroadcastss zmm24{k5}{z}, [rbx+r11*8+256] vbroadcastss zmm24{k5}{z}, [rbx+r11*8-256] vcmppd k3, xmm7, xmm0, 10 vcmppd k3, xmm7, [rbx], 10 vcmppd k3, xmm7, [rbx]{1to2}, 10 vcmppd k3, xmm7, [rbx+r11*8+256], 10 vcmppd k3, xmm7, [rbx+r11*8-256], 10 vcmppd k3, ymm13, ymm15, 10 vcmppd k3, ymm13, [rbx], 10 vcmppd k3, ymm13, [rbx]{1to4}, 10 vcmppd k3, ymm13, [rbx+r11*8+256], 10 vcmppd k3, ymm13, [rbx+r11*8-256], 10 vcmppd k3, zmm24, zmm31, 10 vcmppd k3, zmm24, [rbx], 10 vcmppd k3, zmm24, [rbx]{1to8}, 10 vcmppd k3, zmm24, [rbx+r11*8+256], 10 vcmppd k3, zmm24, [rbx+r11*8-256], 10 vcmppd k3{k5}, xmm7, xmm0, 10 vcmppd k3{k5}, xmm7, [rbx], 10 vcmppd k3{k5}, xmm7, [rbx]{1to2}, 10 vcmppd k3{k5}, xmm7, [rbx+r11*8+256], 10 vcmppd k3{k5}, xmm7, [rbx+r11*8-256], 10 vcmppd k3{k5}, ymm13, ymm15, 10 vcmppd k3{k5}, ymm13, [rbx], 10 vcmppd k3{k5}, ymm13, [rbx]{1to4}, 10 vcmppd k3{k5}, ymm13, [rbx+r11*8+256], 10 vcmppd k3{k5}, ymm13, [rbx+r11*8-256], 10 vcmppd k3{k5}, zmm24, zmm31, 10 vcmppd k3{k5}, zmm24, [rbx], 10 vcmppd k3{k5}, zmm24, [rbx]{1to8}, 10 vcmppd k3{k5}, zmm24, [rbx+r11*8+256], 10 vcmppd k3{k5}, zmm24, [rbx+r11*8-256], 10 vcmpps k3, xmm7, xmm0, 10 vcmpps k3, xmm7, [rbx], 10 vcmpps k3, xmm7, [rbx]{1to4}, 10 vcmpps k3, xmm7, [rbx+r11*8+256], 10 vcmpps k3, xmm7, [rbx+r11*8-256], 10 vcmpps k3, ymm13, ymm15, 10 vcmpps k3, ymm13, [rbx], 10 vcmpps k3, ymm13, [rbx]{1to8}, 10 vcmpps k3, ymm13, [rbx+r11*8+256], 10 vcmpps k3, ymm13, [rbx+r11*8-256], 10 vcmpps k3, zmm24, zmm31, 10 vcmpps k3, zmm24, [rbx], 10 vcmpps k3, zmm24, [rbx]{1to16}, 10 vcmpps k3, zmm24, [rbx+r11*8+256], 10 vcmpps k3, zmm24, [rbx+r11*8-256], 10 vcmpps k3{k5}, xmm7, xmm0, 10 vcmpps k3{k5}, xmm7, [rbx], 10 vcmpps k3{k5}, xmm7, [rbx]{1to4}, 10 vcmpps k3{k5}, xmm7, [rbx+r11*8+256], 10 vcmpps k3{k5}, xmm7, [rbx+r11*8-256], 10 vcmpps k3{k5}, ymm13, ymm15, 10 vcmpps k3{k5}, ymm13, [rbx], 10 vcmpps k3{k5}, ymm13, [rbx]{1to8}, 10 vcmpps k3{k5}, ymm13, [rbx+r11*8+256], 10 vcmpps k3{k5}, ymm13, [rbx+r11*8-256], 10 vcmpps k3{k5}, zmm24, zmm31, 10 vcmpps k3{k5}, zmm24, [rbx], 10 vcmpps k3{k5}, zmm24, [rbx]{1to16}, 10 vcmpps k3{k5}, zmm24, [rbx+r11*8+256], 10 vcmpps k3{k5}, zmm24, [rbx+r11*8-256], 10 vcmpsd k3, xmm7, xmm0, 10 vcmpsd k3, xmm7, [rbx], 10 vcmpsd k3, xmm7, [rbx+r11*8+256], 10 vcmpsd k3, xmm7, [rbx+r11*8-256], 10 vcmpsd k3{k5}, xmm7, xmm0, 10 vcmpsd k3{k5}, xmm7, [rbx], 10 vcmpsd k3{k5}, xmm7, [rbx+r11*8+256], 10 vcmpsd k3{k5}, xmm7, [rbx+r11*8-256], 10 vcmpss k3, xmm7, xmm0, 10 vcmpss k3, xmm7, [rbx], 10 vcmpss k3, xmm7, [rbx+r11*8+256], 10 vcmpss k3, xmm7, [rbx+r11*8-256], 10 vcmpss k3{k5}, xmm7, xmm0, 10 vcmpss k3{k5}, xmm7, [rbx], 10 vcmpss k3{k5}, xmm7, [rbx+r11*8+256], 10 vcmpss k3{k5}, xmm7, [rbx+r11*8-256], 10 vcomisd xmm2, xmm0 vcomisd xmm2, xmm0, {sae} vcomisd xmm2, [rbx] vcomisd xmm2, [rbx+r11*8+256] vcomisd xmm2, [rbx+r11*8-256] vcomiss xmm2, xmm0 vcomiss xmm2, xmm0, {sae} vcomiss xmm2, [rbx] vcomiss xmm2, [rbx+r11*8+256] vcomiss xmm2, [rbx+r11*8-256] vcompresspd xmm0, xmm2 vcompresspd ymm15, ymm16 vcompresspd zmm31, zmm24 vcompresspd [rbx], xmm2 vcompresspd [rbx], ymm16 vcompresspd [rbx], zmm24 vcompresspd [rbx+r11*8+256], xmm2 vcompresspd [rbx+r11*8+256], ymm16 vcompresspd [rbx+r11*8+256], zmm24 vcompresspd [rbx+r11*8-256], xmm2 vcompresspd [rbx+r11*8-256], ymm16 vcompresspd [rbx+r11*8-256], zmm24 vcompressps xmm0, xmm2 vcompressps ymm15, ymm16 vcompressps zmm31, zmm24 vcompressps [rbx], xmm2 vcompressps [rbx], ymm16 vcompressps [rbx], zmm24 vcompressps [rbx+r11*8+256], xmm2 vcompressps [rbx+r11*8+256], ymm16 vcompressps [rbx+r11*8+256], zmm24 vcompressps [rbx+r11*8-256], xmm2 vcompressps [rbx+r11*8-256], ymm16 vcompressps [rbx+r11*8-256], zmm24 vcvtdq2pd xmm2, xmm0 vcvtdq2pd xmm2, [rbx] vcvtdq2pd xmm2, [rbx]{1to2} vcvtdq2pd xmm2, [rbx+r11*8+256] vcvtdq2pd xmm2, [rbx+r11*8-256] vcvtdq2pd xmm2{k5}, xmm0 vcvtdq2pd xmm2{k5}, [rbx] vcvtdq2pd xmm2{k5}, [rbx]{1to2} vcvtdq2pd xmm2{k5}, [rbx+r11*8+256] vcvtdq2pd xmm2{k5}, [rbx+r11*8-256] vcvtdq2pd xmm2{k5}{z}, xmm0 vcvtdq2pd xmm2{k5}{z}, [rbx] vcvtdq2pd xmm2{k5}{z}, [rbx]{1to2} vcvtdq2pd xmm2{k5}{z}, [rbx+r11*8+256] vcvtdq2pd xmm2{k5}{z}, [rbx+r11*8-256] vcvtdq2pd ymm16, xmm0 vcvtdq2pd ymm16, [rbx] vcvtdq2pd ymm16, [rbx]{1to4} vcvtdq2pd ymm16, [rbx+r11*8+256] vcvtdq2pd ymm16, [rbx+r11*8-256] vcvtdq2pd ymm16{k5}, xmm0 vcvtdq2pd ymm16{k5}, [rbx] vcvtdq2pd ymm16{k5}, [rbx]{1to4} vcvtdq2pd ymm16{k5}, [rbx+r11*8+256] vcvtdq2pd ymm16{k5}, [rbx+r11*8-256] vcvtdq2pd ymm16{k5}{z}, xmm0 vcvtdq2pd ymm16{k5}{z}, [rbx] vcvtdq2pd ymm16{k5}{z}, [rbx]{1to4} vcvtdq2pd ymm16{k5}{z}, [rbx+r11*8+256] vcvtdq2pd ymm16{k5}{z}, [rbx+r11*8-256] vcvtdq2pd zmm24, ymm15 vcvtdq2pd zmm24, [rbx] vcvtdq2pd zmm24, [rbx]{1to8} vcvtdq2pd zmm24, [rbx+r11*8+256] vcvtdq2pd zmm24, [rbx+r11*8-256] vcvtdq2pd zmm24{k5}, ymm15 vcvtdq2pd zmm24{k5}, [rbx] vcvtdq2pd zmm24{k5}, [rbx]{1to8} vcvtdq2pd zmm24{k5}, [rbx+r11*8+256] vcvtdq2pd zmm24{k5}, [rbx+r11*8-256] vcvtdq2pd zmm24{k5}{z}, ymm15 vcvtdq2pd zmm24{k5}{z}, [rbx] vcvtdq2pd zmm24{k5}{z}, [rbx]{1to8} vcvtdq2pd zmm24{k5}{z}, [rbx+r11*8+256] vcvtdq2pd zmm24{k5}{z}, [rbx+r11*8-256] vcvtdq2ps xmm2, xmm0 vcvtdq2ps xmm2, [rbx] vcvtdq2ps xmm2, [rbx]{1to4} vcvtdq2ps xmm2, [rbx+r11*8+256] vcvtdq2ps xmm2, [rbx+r11*8-256] vcvtdq2ps xmm2{k5}, xmm0 vcvtdq2ps xmm2{k5}, [rbx] vcvtdq2ps xmm2{k5}, [rbx]{1to4} vcvtdq2ps xmm2{k5}, [rbx+r11*8+256] vcvtdq2ps xmm2{k5}, [rbx+r11*8-256] vcvtdq2ps xmm2{k5}{z}, xmm0 vcvtdq2ps xmm2{k5}{z}, [rbx] vcvtdq2ps xmm2{k5}{z}, [rbx]{1to4} vcvtdq2ps xmm2{k5}{z}, [rbx+r11*8+256] vcvtdq2ps xmm2{k5}{z}, [rbx+r11*8-256] vcvtdq2ps ymm16, ymm15 vcvtdq2ps ymm16, [rbx] vcvtdq2ps ymm16, [rbx]{1to8} vcvtdq2ps ymm16, [rbx+r11*8+256] vcvtdq2ps ymm16, [rbx+r11*8-256] vcvtdq2ps ymm16{k5}, ymm15 vcvtdq2ps ymm16{k5}, [rbx] vcvtdq2ps ymm16{k5}, [rbx]{1to8} vcvtdq2ps ymm16{k5}, [rbx+r11*8+256] vcvtdq2ps ymm16{k5}, [rbx+r11*8-256] vcvtdq2ps ymm16{k5}{z}, ymm15 vcvtdq2ps ymm16{k5}{z}, [rbx] vcvtdq2ps ymm16{k5}{z}, [rbx]{1to8} vcvtdq2ps ymm16{k5}{z}, [rbx+r11*8+256] vcvtdq2ps ymm16{k5}{z}, [rbx+r11*8-256] vcvtdq2ps zmm24, zmm31 vcvtdq2ps zmm24, zmm31, {rd-sae} vcvtdq2ps zmm24, [rbx] vcvtdq2ps zmm24, [rbx]{1to16} vcvtdq2ps zmm24, [rbx+r11*8+256] vcvtdq2ps zmm24, [rbx+r11*8-256] vcvtdq2ps zmm24{k5}, zmm31 vcvtdq2ps zmm24{k5}, zmm31, {rd-sae} vcvtdq2ps zmm24{k5}, [rbx] vcvtdq2ps zmm24{k5}, [rbx]{1to16} vcvtdq2ps zmm24{k5}, [rbx+r11*8+256] vcvtdq2ps zmm24{k5}, [rbx+r11*8-256] vcvtdq2ps zmm24{k5}{z}, zmm31 vcvtdq2ps zmm24{k5}{z}, zmm31, {rd-sae} vcvtdq2ps zmm24{k5}{z}, [rbx] vcvtdq2ps zmm24{k5}{z}, [rbx]{1to16} vcvtdq2ps zmm24{k5}{z}, [rbx+r11*8+256] vcvtdq2ps zmm24{k5}{z}, [rbx+r11*8-256] vcvtpd2dq xmm2, xmm0 vcvtpd2dq xmm2, ymm15 vcvtpd2dq xmm2, [rbx] vcvtpd2dq xmm2, [rbx]{1to2} vcvtpd2dq xmm2, [rbx]{1to4} vcvtpd2dq xmm2, [rbx+r11*8+256] vcvtpd2dq xmm2, [rbx+r11*8-256] vcvtpd2dq xmm2{k5}, xmm0 vcvtpd2dq xmm2{k5}, ymm15 vcvtpd2dq xmm2{k5}, [rbx]{1to2} vcvtpd2dq xmm2{k5}, [rbx]{1to4} vcvtpd2dq xmm2{k5}{z}, xmm0 vcvtpd2dq xmm2{k5}{z}, ymm15 vcvtpd2dq xmm2{k5}{z}, [rbx]{1to2} vcvtpd2dq xmm2{k5}{z}, [rbx]{1to4} vcvtpd2dq ymm16, zmm31 vcvtpd2dq ymm16, zmm31, {rd-sae} vcvtpd2dq ymm16, [rbx] vcvtpd2dq ymm16, [rbx]{1to8} vcvtpd2dq ymm16, [rbx+r11*8+256] vcvtpd2dq ymm16, [rbx+r11*8-256] vcvtpd2dq ymm16{k5}, zmm31 vcvtpd2dq ymm16{k5}, zmm31, {rd-sae} vcvtpd2dq ymm16{k5}, [rbx] vcvtpd2dq ymm16{k5}, [rbx]{1to8} vcvtpd2dq ymm16{k5}, [rbx+r11*8+256] vcvtpd2dq ymm16{k5}, [rbx+r11*8-256] vcvtpd2dq ymm16{k5}{z}, zmm31 vcvtpd2dq ymm16{k5}{z}, zmm31, {rd-sae} vcvtpd2dq ymm16{k5}{z}, [rbx] vcvtpd2dq ymm16{k5}{z}, [rbx]{1to8} vcvtpd2dq ymm16{k5}{z}, [rbx+r11*8+256] vcvtpd2dq ymm16{k5}{z}, [rbx+r11*8-256] vcvtpd2ps xmm2, xmm0 vcvtpd2ps xmm2, ymm15 vcvtpd2ps xmm2, [rbx] vcvtpd2ps xmm2, [rbx]{1to2} vcvtpd2ps xmm2, [rbx]{1to4} vcvtpd2ps xmm2, [rbx+r11*8+256] vcvtpd2ps xmm2, [rbx+r11*8-256] vcvtpd2ps xmm2{k5}, xmm0 vcvtpd2ps xmm2{k5}, ymm15 vcvtpd2ps xmm2{k5}, [rbx]{1to2} vcvtpd2ps xmm2{k5}, [rbx]{1to4} vcvtpd2ps xmm2{k5}{z}, xmm0 vcvtpd2ps xmm2{k5}{z}, ymm15 vcvtpd2ps xmm2{k5}{z}, [rbx]{1to2} vcvtpd2ps xmm2{k5}{z}, [rbx]{1to4} vcvtpd2ps ymm16, zmm31 vcvtpd2ps ymm16, zmm31, {rd-sae} vcvtpd2ps ymm16, [rbx] vcvtpd2ps ymm16, [rbx]{1to8} vcvtpd2ps ymm16, [rbx+r11*8+256] vcvtpd2ps ymm16, [rbx+r11*8-256] vcvtpd2ps ymm16{k5}, zmm31 vcvtpd2ps ymm16{k5}, zmm31, {rd-sae} vcvtpd2ps ymm16{k5}, [rbx] vcvtpd2ps ymm16{k5}, [rbx]{1to8} vcvtpd2ps ymm16{k5}, [rbx+r11*8+256] vcvtpd2ps ymm16{k5}, [rbx+r11*8-256] vcvtpd2ps ymm16{k5}{z}, zmm31 vcvtpd2ps ymm16{k5}{z}, zmm31, {rd-sae} vcvtpd2ps ymm16{k5}{z}, [rbx] vcvtpd2ps ymm16{k5}{z}, [rbx]{1to8} vcvtpd2ps ymm16{k5}{z}, [rbx+r11*8+256] vcvtpd2ps ymm16{k5}{z}, [rbx+r11*8-256] vcvtpd2udq xmm2, xmm0 vcvtpd2udq xmm2, ymm15 vcvtpd2udq xmm2, [rbx]{1to2} vcvtpd2udq xmm2, [rbx]{1to4} vcvtpd2udq xmm2{k5}, xmm0 vcvtpd2udq xmm2{k5}, ymm15 vcvtpd2udq xmm2{k5}, [rbx]{1to2} vcvtpd2udq xmm2{k5}, [rbx]{1to4} vcvtpd2udq xmm2{k5}{z}, xmm0 vcvtpd2udq xmm2{k5}{z}, ymm15 vcvtpd2udq xmm2{k5}{z}, [rbx]{1to2} vcvtpd2udq xmm2{k5}{z}, [rbx]{1to4} vcvtpd2udq ymm16, zmm31 vcvtpd2udq ymm16, zmm31, {rd-sae} vcvtpd2udq ymm16, [rbx] vcvtpd2udq ymm16, [rbx]{1to8} vcvtpd2udq ymm16, [rbx+r11*8+256] vcvtpd2udq ymm16, [rbx+r11*8-256] vcvtpd2udq ymm16{k5}, zmm31 vcvtpd2udq ymm16{k5}, zmm31, {rd-sae} vcvtpd2udq ymm16{k5}, [rbx] vcvtpd2udq ymm16{k5}, [rbx]{1to8} vcvtpd2udq ymm16{k5}, [rbx+r11*8+256] vcvtpd2udq ymm16{k5}, [rbx+r11*8-256] vcvtpd2udq ymm16{k5}{z}, zmm31 vcvtpd2udq ymm16{k5}{z}, zmm31, {rd-sae} vcvtpd2udq ymm16{k5}{z}, [rbx] vcvtpd2udq ymm16{k5}{z}, [rbx]{1to8} vcvtpd2udq ymm16{k5}{z}, [rbx+r11*8+256] vcvtpd2udq ymm16{k5}{z}, [rbx+r11*8-256] vcvtph2ps xmm2, xmm0 vcvtph2ps xmm2, [rbx] vcvtph2ps xmm2, [rbx+r11*8+256] vcvtph2ps xmm2, [rbx+r11*8-256] vcvtph2ps xmm2{k5}, xmm0 vcvtph2ps xmm2{k5}, [rbx] vcvtph2ps xmm2{k5}, [rbx+r11*8+256] vcvtph2ps xmm2{k5}, [rbx+r11*8-256] vcvtph2ps xmm2{k5}{z}, xmm0 vcvtph2ps xmm2{k5}{z}, [rbx] vcvtph2ps xmm2{k5}{z}, [rbx+r11*8+256] vcvtph2ps xmm2{k5}{z}, [rbx+r11*8-256] vcvtph2ps ymm16, xmm0 vcvtph2ps ymm16, [rbx] vcvtph2ps ymm16, [rbx+r11*8+256] vcvtph2ps ymm16, [rbx+r11*8-256] vcvtph2ps ymm16{k5}, xmm0 vcvtph2ps ymm16{k5}, [rbx] vcvtph2ps ymm16{k5}, [rbx+r11*8+256] vcvtph2ps ymm16{k5}, [rbx+r11*8-256] vcvtph2ps ymm16{k5}{z}, xmm0 vcvtph2ps ymm16{k5}{z}, [rbx] vcvtph2ps ymm16{k5}{z}, [rbx+r11*8+256] vcvtph2ps ymm16{k5}{z}, [rbx+r11*8-256] vcvtph2ps zmm24, ymm15 vcvtph2ps zmm24, ymm15, {sae} vcvtph2ps zmm24, [rbx] vcvtph2ps zmm24, [rbx+r11*8+256] vcvtph2ps zmm24, [rbx+r11*8-256] vcvtph2ps zmm24{k5}, ymm15 vcvtph2ps zmm24{k5}, ymm15, {sae} vcvtph2ps zmm24{k5}, [rbx] vcvtph2ps zmm24{k5}, [rbx+r11*8+256] vcvtph2ps zmm24{k5}, [rbx+r11*8-256] vcvtph2ps zmm24{k5}{z}, ymm15 vcvtph2ps zmm24{k5}{z}, ymm15, {sae} vcvtph2ps zmm24{k5}{z}, [rbx] vcvtph2ps zmm24{k5}{z}, [rbx+r11*8+256] vcvtph2ps zmm24{k5}{z}, [rbx+r11*8-256] vcvtps2dq xmm2, xmm0 vcvtps2dq xmm2, [rbx] vcvtps2dq xmm2, [rbx]{1to4} vcvtps2dq xmm2, [rbx+r11*8+256] vcvtps2dq xmm2, [rbx+r11*8-256] vcvtps2dq xmm2{k5}, xmm0 vcvtps2dq xmm2{k5}, [rbx] vcvtps2dq xmm2{k5}, [rbx]{1to4} vcvtps2dq xmm2{k5}, [rbx+r11*8+256] vcvtps2dq xmm2{k5}, [rbx+r11*8-256] vcvtps2dq xmm2{k5}{z}, xmm0 vcvtps2dq xmm2{k5}{z}, [rbx] vcvtps2dq xmm2{k5}{z}, [rbx]{1to4} vcvtps2dq xmm2{k5}{z}, [rbx+r11*8+256] vcvtps2dq xmm2{k5}{z}, [rbx+r11*8-256] vcvtps2dq ymm16, ymm15 vcvtps2dq ymm16, [rbx] vcvtps2dq ymm16, [rbx]{1to8} vcvtps2dq ymm16, [rbx+r11*8+256] vcvtps2dq ymm16, [rbx+r11*8-256] vcvtps2dq ymm16{k5}, ymm15 vcvtps2dq ymm16{k5}, [rbx] vcvtps2dq ymm16{k5}, [rbx]{1to8} vcvtps2dq ymm16{k5}, [rbx+r11*8+256] vcvtps2dq ymm16{k5}, [rbx+r11*8-256] vcvtps2dq ymm16{k5}{z}, ymm15 vcvtps2dq ymm16{k5}{z}, [rbx] vcvtps2dq ymm16{k5}{z}, [rbx]{1to8} vcvtps2dq ymm16{k5}{z}, [rbx+r11*8+256] vcvtps2dq ymm16{k5}{z}, [rbx+r11*8-256] vcvtps2dq zmm24, zmm31 vcvtps2dq zmm24, zmm31, {rd-sae} vcvtps2dq zmm24, [rbx] vcvtps2dq zmm24, [rbx]{1to16} vcvtps2dq zmm24, [rbx+r11*8+256] vcvtps2dq zmm24, [rbx+r11*8-256] vcvtps2dq zmm24{k5}, zmm31 vcvtps2dq zmm24{k5}, zmm31, {rd-sae} vcvtps2dq zmm24{k5}, [rbx] vcvtps2dq zmm24{k5}, [rbx]{1to16} vcvtps2dq zmm24{k5}, [rbx+r11*8+256] vcvtps2dq zmm24{k5}, [rbx+r11*8-256] vcvtps2dq zmm24{k5}{z}, zmm31 vcvtps2dq zmm24{k5}{z}, zmm31, {rd-sae} vcvtps2dq zmm24{k5}{z}, [rbx] vcvtps2dq zmm24{k5}{z}, [rbx]{1to16} vcvtps2dq zmm24{k5}{z}, [rbx+r11*8+256] vcvtps2dq zmm24{k5}{z}, [rbx+r11*8-256] vcvtps2pd xmm2, xmm0 vcvtps2pd xmm2, [rbx] vcvtps2pd xmm2, [rbx]{1to2} vcvtps2pd xmm2, [rbx+r11*8+256] vcvtps2pd xmm2, [rbx+r11*8-256] vcvtps2pd xmm2{k5}, xmm0 vcvtps2pd xmm2{k5}, [rbx] vcvtps2pd xmm2{k5}, [rbx]{1to2} vcvtps2pd xmm2{k5}, [rbx+r11*8+256] vcvtps2pd xmm2{k5}, [rbx+r11*8-256] vcvtps2pd xmm2{k5}{z}, xmm0 vcvtps2pd xmm2{k5}{z}, [rbx] vcvtps2pd xmm2{k5}{z}, [rbx]{1to2} vcvtps2pd xmm2{k5}{z}, [rbx+r11*8+256] vcvtps2pd xmm2{k5}{z}, [rbx+r11*8-256] vcvtps2pd ymm16, xmm0 vcvtps2pd ymm16, [rbx] vcvtps2pd ymm16, [rbx]{1to4} vcvtps2pd ymm16, [rbx+r11*8+256] vcvtps2pd ymm16, [rbx+r11*8-256] vcvtps2pd ymm16{k5}, xmm0 vcvtps2pd ymm16{k5}, [rbx] vcvtps2pd ymm16{k5}, [rbx]{1to4} vcvtps2pd ymm16{k5}, [rbx+r11*8+256] vcvtps2pd ymm16{k5}, [rbx+r11*8-256] vcvtps2pd ymm16{k5}{z}, xmm0 vcvtps2pd ymm16{k5}{z}, [rbx] vcvtps2pd ymm16{k5}{z}, [rbx]{1to4} vcvtps2pd ymm16{k5}{z}, [rbx+r11*8+256] vcvtps2pd ymm16{k5}{z}, [rbx+r11*8-256] vcvtps2pd zmm24, ymm15 vcvtps2pd zmm24, ymm15, {sae} vcvtps2pd zmm24, [rbx] vcvtps2pd zmm24, [rbx]{1to8} vcvtps2pd zmm24, [rbx+r11*8+256] vcvtps2pd zmm24, [rbx+r11*8-256] vcvtps2pd zmm24{k5}, ymm15 vcvtps2pd zmm24{k5}, ymm15, {sae} vcvtps2pd zmm24{k5}, [rbx] vcvtps2pd zmm24{k5}, [rbx]{1to8} vcvtps2pd zmm24{k5}, [rbx+r11*8+256] vcvtps2pd zmm24{k5}, [rbx+r11*8-256] vcvtps2pd zmm24{k5}{z}, ymm15 vcvtps2pd zmm24{k5}{z}, ymm15, {sae} vcvtps2pd zmm24{k5}{z}, [rbx] vcvtps2pd zmm24{k5}{z}, [rbx]{1to8} vcvtps2pd zmm24{k5}{z}, [rbx+r11*8+256] vcvtps2pd zmm24{k5}{z}, [rbx+r11*8-256] vcvtps2ph xmm0, xmm2, 10 vcvtps2ph xmm0, ymm16, 10 vcvtps2ph ymm15, zmm24, 10 vcvtps2ph [rbx], xmm2, 10 vcvtps2ph [rbx], ymm16, 10 vcvtps2ph [rbx], zmm24, 10 vcvtps2ph [rbx+r11*8+256], xmm2, 10 vcvtps2ph [rbx+r11*8+256], ymm16, 10 vcvtps2ph [rbx+r11*8+256], zmm24, 10 vcvtps2ph [rbx+r11*8-256], xmm2, 10 vcvtps2ph [rbx+r11*8-256], ymm16, 10 vcvtps2ph [rbx+r11*8-256], zmm24, 10 vcvtps2udq xmm2, xmm0 vcvtps2udq xmm2, [rbx] vcvtps2udq xmm2, [rbx]{1to4} vcvtps2udq xmm2, [rbx+r11*8+256] vcvtps2udq xmm2, [rbx+r11*8-256] vcvtps2udq xmm2{k5}, xmm0 vcvtps2udq xmm2{k5}, [rbx] vcvtps2udq xmm2{k5}, [rbx]{1to4} vcvtps2udq xmm2{k5}, [rbx+r11*8+256] vcvtps2udq xmm2{k5}, [rbx+r11*8-256] vcvtps2udq xmm2{k5}{z}, xmm0 vcvtps2udq xmm2{k5}{z}, [rbx] vcvtps2udq xmm2{k5}{z}, [rbx]{1to4} vcvtps2udq xmm2{k5}{z}, [rbx+r11*8+256] vcvtps2udq xmm2{k5}{z}, [rbx+r11*8-256] vcvtps2udq ymm16, ymm15 vcvtps2udq ymm16, [rbx] vcvtps2udq ymm16, [rbx]{1to8} vcvtps2udq ymm16, [rbx+r11*8+256] vcvtps2udq ymm16, [rbx+r11*8-256] vcvtps2udq ymm16{k5}, ymm15 vcvtps2udq ymm16{k5}, [rbx] vcvtps2udq ymm16{k5}, [rbx]{1to8} vcvtps2udq ymm16{k5}, [rbx+r11*8+256] vcvtps2udq ymm16{k5}, [rbx+r11*8-256] vcvtps2udq ymm16{k5}{z}, ymm15 vcvtps2udq ymm16{k5}{z}, [rbx] vcvtps2udq ymm16{k5}{z}, [rbx]{1to8} vcvtps2udq ymm16{k5}{z}, [rbx+r11*8+256] vcvtps2udq ymm16{k5}{z}, [rbx+r11*8-256] vcvtps2udq zmm24, zmm31 vcvtps2udq zmm24, zmm31, {rd-sae} vcvtps2udq zmm24, [rbx] vcvtps2udq zmm24, [rbx]{1to16} vcvtps2udq zmm24, [rbx+r11*8+256] vcvtps2udq zmm24, [rbx+r11*8-256] vcvtps2udq zmm24{k5}, zmm31 vcvtps2udq zmm24{k5}, zmm31, {rd-sae} vcvtps2udq zmm24{k5}, [rbx] vcvtps2udq zmm24{k5}, [rbx]{1to16} vcvtps2udq zmm24{k5}, [rbx+r11*8+256] vcvtps2udq zmm24{k5}, [rbx+r11*8-256] vcvtps2udq zmm24{k5}{z}, zmm31 vcvtps2udq zmm24{k5}{z}, zmm31, {rd-sae} vcvtps2udq zmm24{k5}{z}, [rbx] vcvtps2udq zmm24{k5}{z}, [rbx]{1to16} vcvtps2udq zmm24{k5}{z}, [rbx+r11*8+256] vcvtps2udq zmm24{k5}{z}, [rbx+r11*8-256] vcvtsd2si ecx, xmm0 vcvtsd2si ecx, xmm0, {rd-sae} vcvtsd2si ecx, [rbx] vcvtsd2si ecx, [rbx+r11*8+256] vcvtsd2si ecx, [rbx+r11*8-256] vcvtsd2si rcx, xmm0 vcvtsd2si rcx, xmm0, {rd-sae} vcvtsd2si rcx, [rbx] vcvtsd2si rcx, [rbx+r11*8+256] vcvtsd2si rcx, [rbx+r11*8-256] vcvtsd2ss xmm2, xmm7, xmm0 vcvtsd2ss xmm2, xmm7, xmm0, {rd-sae} vcvtsd2ss xmm2, xmm7, [rbx] vcvtsd2ss xmm2, xmm7, [rbx+r11*8+256] vcvtsd2ss xmm2, xmm7, [rbx+r11*8-256] vcvtsd2ss xmm2{k5}, xmm7, xmm0 vcvtsd2ss xmm2{k5}, xmm7, xmm0, {rd-sae} vcvtsd2ss xmm2{k5}, xmm7, [rbx] vcvtsd2ss xmm2{k5}, xmm7, [rbx+r11*8+256] vcvtsd2ss xmm2{k5}, xmm7, [rbx+r11*8-256] vcvtsd2ss xmm2{k5}{z}, xmm7, xmm0 vcvtsd2ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vcvtsd2ss xmm2{k5}{z}, xmm7, [rbx] vcvtsd2ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vcvtsd2ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vcvtsd2usi ecx, xmm0 vcvtsd2usi ecx, xmm0, {rd-sae} vcvtsd2usi ecx, [rbx] vcvtsd2usi ecx, [rbx+r11*8+256] vcvtsd2usi ecx, [rbx+r11*8-256] vcvtsd2usi rcx, xmm0 vcvtsd2usi rcx, xmm0, {rd-sae} vcvtsd2usi rcx, [rbx] vcvtsd2usi rcx, [rbx+r11*8+256] vcvtsd2usi rcx, [rbx+r11*8-256] vcvtsi2sd xmm2, xmm7, ecx vcvtsi2sd xmm2, xmm7, rcx vcvtsi2sd xmm2, xmm7, [rbx] vcvtsi2sd xmm2, xmm7, [rbx+rsi*8+256] vcvtsi2sd xmm2, xmm7, ecx vcvtsi2sd xmm2, xmm7, rcx vcvtsi2sd xmm2, xmm7, [rbx] vcvtsi2sd xmm2, xmm7, [rbx+rsi*8+256] vcvtsi2ss xmm2, xmm7, ecx vcvtsi2ss xmm2, xmm7, rcx vcvtsi2ss xmm2, xmm7, [rbx] vcvtsi2ss xmm2, xmm7, [rbx+rsi*8+256] vcvtss2sd xmm2, xmm7, xmm0 vcvtss2sd xmm2, xmm7, xmm0, {sae} vcvtss2sd xmm2, xmm7, [rbx] vcvtss2sd xmm2, xmm7, [rbx+r11*8+256] vcvtss2sd xmm2, xmm7, [rbx+r11*8-256] vcvtss2sd xmm2{k5}, xmm7, xmm0 vcvtss2sd xmm2{k5}, xmm7, xmm0, {sae} vcvtss2sd xmm2{k5}, xmm7, [rbx] vcvtss2sd xmm2{k5}, xmm7, [rbx+r11*8+256] vcvtss2sd xmm2{k5}, xmm7, [rbx+r11*8-256] vcvtss2sd xmm2{k5}{z}, xmm7, xmm0 vcvtss2sd xmm2{k5}{z}, xmm7, xmm0, {sae} vcvtss2sd xmm2{k5}{z}, xmm7, [rbx] vcvtss2sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vcvtss2sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vcvtss2si ecx, xmm0 vcvtss2si ecx, xmm0, {rd-sae} vcvtss2si ecx, [rbx] vcvtss2si ecx, [rbx+r11*8+256] vcvtss2si ecx, [rbx+r11*8-256] vcvtss2si rcx, xmm0 vcvtss2si rcx, xmm0, {rd-sae} vcvtss2si rcx, [rbx] vcvtss2si rcx, [rbx+r11*8+256] vcvtss2si rcx, [rbx+r11*8-256] vcvtss2usi ecx, xmm0 vcvtss2usi ecx, xmm0, {rd-sae} vcvtss2usi ecx, [rbx] vcvtss2usi ecx, [rbx+r11*8+256] vcvtss2usi ecx, [rbx+r11*8-256] vcvtss2usi rcx, xmm0 vcvtss2usi rcx, xmm0, {rd-sae} vcvtss2usi rcx, [rbx] vcvtss2usi rcx, [rbx+r11*8+256] vcvtss2usi rcx, [rbx+r11*8-256] vcvttpd2dq xmm2, xmm0 vcvttpd2dq xmm2, ymm15 vcvttpd2dq xmm2, [rbx] vcvttpd2dq xmm2, [rbx]{1to2} vcvttpd2dq xmm2, [rbx]{1to4} vcvttpd2dq xmm2, [rbx+r11*8+256] vcvttpd2dq xmm2, [rbx+r11*8-256] vcvttpd2dq xmm2{k5}, xmm0 vcvttpd2dq xmm2{k5}, ymm15 vcvttpd2dq xmm2{k5}, [rbx]{1to2} vcvttpd2dq xmm2{k5}, [rbx]{1to4} vcvttpd2dq xmm2{k5}{z}, xmm0 vcvttpd2dq xmm2{k5}{z}, ymm15 vcvttpd2dq xmm2{k5}{z}, [rbx]{1to2} vcvttpd2dq xmm2{k5}{z}, [rbx]{1to4} vcvttpd2dq ymm16, zmm31 vcvttpd2dq ymm16, zmm31, {sae} vcvttpd2dq ymm16, [rbx] vcvttpd2dq ymm16, [rbx]{1to8} vcvttpd2dq ymm16, [rbx+r11*8+256] vcvttpd2dq ymm16, [rbx+r11*8-256] vcvttpd2dq ymm16{k5}, zmm31 vcvttpd2dq ymm16{k5}, zmm31, {sae} vcvttpd2dq ymm16{k5}, [rbx] vcvttpd2dq ymm16{k5}, [rbx]{1to8} vcvttpd2dq ymm16{k5}, [rbx+r11*8+256] vcvttpd2dq ymm16{k5}, [rbx+r11*8-256] vcvttpd2dq ymm16{k5}{z}, zmm31 vcvttpd2dq ymm16{k5}{z}, zmm31, {sae} vcvttpd2dq ymm16{k5}{z}, [rbx] vcvttpd2dq ymm16{k5}{z}, [rbx]{1to8} vcvttpd2dq ymm16{k5}{z}, [rbx+r11*8+256] vcvttpd2dq ymm16{k5}{z}, [rbx+r11*8-256] vcvttpd2udq xmm2, xmm0 vcvttpd2udq xmm2, ymm15 vcvttpd2udq xmm2, [rbx]{1to2} vcvttpd2udq xmm2, [rbx]{1to4} vcvttpd2udq xmm2{k5}, xmm0 vcvttpd2udq xmm2{k5}, ymm15 vcvttpd2udq xmm2{k5}, [rbx]{1to2} vcvttpd2udq xmm2{k5}, [rbx]{1to4} vcvttpd2udq xmm2{k5}{z}, xmm0 vcvttpd2udq xmm2{k5}{z}, ymm15 vcvttpd2udq xmm2{k5}{z}, [rbx]{1to2} vcvttpd2udq xmm2{k5}{z}, [rbx]{1to4} vcvttpd2udq ymm16, zmm31 vcvttpd2udq ymm16, zmm31, {sae} vcvttpd2udq ymm16, [rbx] vcvttpd2udq ymm16, [rbx]{1to8} vcvttpd2udq ymm16, [rbx+r11*8+256] vcvttpd2udq ymm16, [rbx+r11*8-256] vcvttpd2udq ymm16{k5}, zmm31 vcvttpd2udq ymm16{k5}, zmm31, {sae} vcvttpd2udq ymm16{k5}, [rbx] vcvttpd2udq ymm16{k5}, [rbx]{1to8} vcvttpd2udq ymm16{k5}, [rbx+r11*8+256] vcvttpd2udq ymm16{k5}, [rbx+r11*8-256] vcvttpd2udq ymm16{k5}{z}, zmm31 vcvttpd2udq ymm16{k5}{z}, zmm31, {sae} vcvttpd2udq ymm16{k5}{z}, [rbx] vcvttpd2udq ymm16{k5}{z}, [rbx]{1to8} vcvttpd2udq ymm16{k5}{z}, [rbx+r11*8+256] vcvttpd2udq ymm16{k5}{z}, [rbx+r11*8-256] vcvttps2dq xmm2, xmm0 vcvttps2dq xmm2, [rbx] vcvttps2dq xmm2, [rbx]{1to4} vcvttps2dq xmm2, [rbx+r11*8+256] vcvttps2dq xmm2, [rbx+r11*8-256] vcvttps2dq xmm2{k5}, xmm0 vcvttps2dq xmm2{k5}, [rbx] vcvttps2dq xmm2{k5}, [rbx]{1to4} vcvttps2dq xmm2{k5}, [rbx+r11*8+256] vcvttps2dq xmm2{k5}, [rbx+r11*8-256] vcvttps2dq xmm2{k5}{z}, xmm0 vcvttps2dq xmm2{k5}{z}, [rbx] vcvttps2dq xmm2{k5}{z}, [rbx]{1to4} vcvttps2dq xmm2{k5}{z}, [rbx+r11*8+256] vcvttps2dq xmm2{k5}{z}, [rbx+r11*8-256] vcvttps2dq ymm16, ymm15 vcvttps2dq ymm16, [rbx] vcvttps2dq ymm16, [rbx]{1to8} vcvttps2dq ymm16, [rbx+r11*8+256] vcvttps2dq ymm16, [rbx+r11*8-256] vcvttps2dq ymm16{k5}, ymm15 vcvttps2dq ymm16{k5}, [rbx] vcvttps2dq ymm16{k5}, [rbx]{1to8} vcvttps2dq ymm16{k5}, [rbx+r11*8+256] vcvttps2dq ymm16{k5}, [rbx+r11*8-256] vcvttps2dq ymm16{k5}{z}, ymm15 vcvttps2dq ymm16{k5}{z}, [rbx] vcvttps2dq ymm16{k5}{z}, [rbx]{1to8} vcvttps2dq ymm16{k5}{z}, [rbx+r11*8+256] vcvttps2dq ymm16{k5}{z}, [rbx+r11*8-256] vcvttps2dq zmm24, zmm31 vcvttps2dq zmm24, zmm31, {sae} vcvttps2dq zmm24, [rbx] vcvttps2dq zmm24, [rbx]{1to16} vcvttps2dq zmm24, [rbx+r11*8+256] vcvttps2dq zmm24, [rbx+r11*8-256] vcvttps2dq zmm24{k5}, zmm31 vcvttps2dq zmm24{k5}, zmm31, {sae} vcvttps2dq zmm24{k5}, [rbx] vcvttps2dq zmm24{k5}, [rbx]{1to16} vcvttps2dq zmm24{k5}, [rbx+r11*8+256] vcvttps2dq zmm24{k5}, [rbx+r11*8-256] vcvttps2dq zmm24{k5}{z}, zmm31 vcvttps2dq zmm24{k5}{z}, zmm31, {sae} vcvttps2dq zmm24{k5}{z}, [rbx] vcvttps2dq zmm24{k5}{z}, [rbx]{1to16} vcvttps2dq zmm24{k5}{z}, [rbx+r11*8+256] vcvttps2dq zmm24{k5}{z}, [rbx+r11*8-256] vcvttps2udq xmm2, xmm0 vcvttps2udq xmm2, [rbx] vcvttps2udq xmm2, [rbx]{1to4} vcvttps2udq xmm2, [rbx+r11*8+256] vcvttps2udq xmm2, [rbx+r11*8-256] vcvttps2udq xmm2{k5}, xmm0 vcvttps2udq xmm2{k5}, [rbx] vcvttps2udq xmm2{k5}, [rbx]{1to4} vcvttps2udq xmm2{k5}, [rbx+r11*8+256] vcvttps2udq xmm2{k5}, [rbx+r11*8-256] vcvttps2udq xmm2{k5}{z}, xmm0 vcvttps2udq xmm2{k5}{z}, [rbx] vcvttps2udq xmm2{k5}{z}, [rbx]{1to4} vcvttps2udq xmm2{k5}{z}, [rbx+r11*8+256] vcvttps2udq xmm2{k5}{z}, [rbx+r11*8-256] vcvttps2udq ymm16, ymm15 vcvttps2udq ymm16, [rbx] vcvttps2udq ymm16, [rbx]{1to8} vcvttps2udq ymm16, [rbx+r11*8+256] vcvttps2udq ymm16, [rbx+r11*8-256] vcvttps2udq ymm16{k5}, ymm15 vcvttps2udq ymm16{k5}, [rbx] vcvttps2udq ymm16{k5}, [rbx]{1to8} vcvttps2udq ymm16{k5}, [rbx+r11*8+256] vcvttps2udq ymm16{k5}, [rbx+r11*8-256] vcvttps2udq ymm16{k5}{z}, ymm15 vcvttps2udq ymm16{k5}{z}, [rbx] vcvttps2udq ymm16{k5}{z}, [rbx]{1to8} vcvttps2udq ymm16{k5}{z}, [rbx+r11*8+256] vcvttps2udq ymm16{k5}{z}, [rbx+r11*8-256] vcvttps2udq zmm24, zmm31 vcvttps2udq zmm24, zmm31, {sae} vcvttps2udq zmm24, [rbx] vcvttps2udq zmm24, [rbx]{1to16} vcvttps2udq zmm24, [rbx+r11*8+256] vcvttps2udq zmm24, [rbx+r11*8-256] vcvttps2udq zmm24{k5}, zmm31 vcvttps2udq zmm24{k5}, zmm31, {sae} vcvttps2udq zmm24{k5}, [rbx] vcvttps2udq zmm24{k5}, [rbx]{1to16} vcvttps2udq zmm24{k5}, [rbx+r11*8+256] vcvttps2udq zmm24{k5}, [rbx+r11*8-256] vcvttps2udq zmm24{k5}{z}, zmm31 vcvttps2udq zmm24{k5}{z}, zmm31, {sae} vcvttps2udq zmm24{k5}{z}, [rbx] vcvttps2udq zmm24{k5}{z}, [rbx]{1to16} vcvttps2udq zmm24{k5}{z}, [rbx+r11*8+256] vcvttps2udq zmm24{k5}{z}, [rbx+r11*8-256] vcvttsd2si ecx, xmm0 vcvttsd2si ecx, xmm0, {sae} vcvttsd2si ecx, [rbx] vcvttsd2si ecx, [rbx+r11*8+256] vcvttsd2si ecx, [rbx+r11*8-256] vcvttsd2si rcx, xmm0 vcvttsd2si rcx, xmm0, {sae} vcvttsd2si rcx, [rbx] vcvttsd2si rcx, [rbx+r11*8+256] vcvttsd2si rcx, [rbx+r11*8-256] vcvttsd2usi ecx, xmm0 vcvttsd2usi ecx, xmm0, {sae} vcvttsd2usi ecx, [rbx] vcvttsd2usi ecx, [rbx+r11*8+256] vcvttsd2usi ecx, [rbx+r11*8-256] vcvttsd2usi rcx, xmm0 vcvttsd2usi rcx, xmm0, {sae} vcvttsd2usi rcx, [rbx] vcvttsd2usi rcx, [rbx+r11*8+256] vcvttsd2usi rcx, [rbx+r11*8-256] vcvttss2si ecx, xmm0 vcvttss2si ecx, xmm0, {sae} vcvttss2si ecx, [rbx] vcvttss2si ecx, [rbx+r11*8+256] vcvttss2si ecx, [rbx+r11*8-256] vcvttss2si rcx, xmm0 vcvttss2si rcx, xmm0, {sae} vcvttss2si rcx, [rbx] vcvttss2si rcx, [rbx+r11*8+256] vcvttss2si rcx, [rbx+r11*8-256] vcvttss2usi ecx, xmm0 vcvttss2usi ecx, xmm0, {sae} vcvttss2usi ecx, [rbx] vcvttss2usi ecx, [rbx+r11*8+256] vcvttss2usi ecx, [rbx+r11*8-256] vcvttss2usi rcx, xmm0 vcvttss2usi rcx, xmm0, {sae} vcvttss2usi rcx, [rbx] vcvttss2usi rcx, [rbx+r11*8+256] vcvttss2usi rcx, [rbx+r11*8-256] vcvtudq2pd xmm2, xmm0 vcvtudq2pd xmm2, [rbx] vcvtudq2pd xmm2, [rbx]{1to2} vcvtudq2pd xmm2, [rbx+r11*8+256] vcvtudq2pd xmm2, [rbx+r11*8-256] vcvtudq2pd xmm2{k5}, xmm0 vcvtudq2pd xmm2{k5}, [rbx] vcvtudq2pd xmm2{k5}, [rbx]{1to2} vcvtudq2pd xmm2{k5}, [rbx+r11*8+256] vcvtudq2pd xmm2{k5}, [rbx+r11*8-256] vcvtudq2pd xmm2{k5}{z}, xmm0 vcvtudq2pd xmm2{k5}{z}, [rbx] vcvtudq2pd xmm2{k5}{z}, [rbx]{1to2} vcvtudq2pd xmm2{k5}{z}, [rbx+r11*8+256] vcvtudq2pd xmm2{k5}{z}, [rbx+r11*8-256] vcvtudq2pd ymm16, xmm0 vcvtudq2pd ymm16, [rbx] vcvtudq2pd ymm16, [rbx]{1to4} vcvtudq2pd ymm16, [rbx+r11*8+256] vcvtudq2pd ymm16, [rbx+r11*8-256] vcvtudq2pd ymm16{k5}, xmm0 vcvtudq2pd ymm16{k5}, [rbx] vcvtudq2pd ymm16{k5}, [rbx]{1to4} vcvtudq2pd ymm16{k5}, [rbx+r11*8+256] vcvtudq2pd ymm16{k5}, [rbx+r11*8-256] vcvtudq2pd ymm16{k5}{z}, xmm0 vcvtudq2pd ymm16{k5}{z}, [rbx] vcvtudq2pd ymm16{k5}{z}, [rbx]{1to4} vcvtudq2pd ymm16{k5}{z}, [rbx+r11*8+256] vcvtudq2pd ymm16{k5}{z}, [rbx+r11*8-256] vcvtudq2pd zmm24, ymm15 vcvtudq2pd zmm24, [rbx] vcvtudq2pd zmm24, [rbx]{1to8} vcvtudq2pd zmm24, [rbx+r11*8+256] vcvtudq2pd zmm24, [rbx+r11*8-256] vcvtudq2pd zmm24{k5}, ymm15 vcvtudq2pd zmm24{k5}, [rbx] vcvtudq2pd zmm24{k5}, [rbx]{1to8} vcvtudq2pd zmm24{k5}, [rbx+r11*8+256] vcvtudq2pd zmm24{k5}, [rbx+r11*8-256] vcvtudq2pd zmm24{k5}{z}, ymm15 vcvtudq2pd zmm24{k5}{z}, [rbx] vcvtudq2pd zmm24{k5}{z}, [rbx]{1to8} vcvtudq2pd zmm24{k5}{z}, [rbx+r11*8+256] vcvtudq2pd zmm24{k5}{z}, [rbx+r11*8-256] vcvtudq2ps xmm2, xmm0 vcvtudq2ps xmm2, [rbx] vcvtudq2ps xmm2, [rbx]{1to4} vcvtudq2ps xmm2, [rbx+r11*8+256] vcvtudq2ps xmm2, [rbx+r11*8-256] vcvtudq2ps xmm2{k5}, xmm0 vcvtudq2ps xmm2{k5}, [rbx] vcvtudq2ps xmm2{k5}, [rbx]{1to4} vcvtudq2ps xmm2{k5}, [rbx+r11*8+256] vcvtudq2ps xmm2{k5}, [rbx+r11*8-256] vcvtudq2ps xmm2{k5}{z}, xmm0 vcvtudq2ps xmm2{k5}{z}, [rbx] vcvtudq2ps xmm2{k5}{z}, [rbx]{1to4} vcvtudq2ps xmm2{k5}{z}, [rbx+r11*8+256] vcvtudq2ps xmm2{k5}{z}, [rbx+r11*8-256] vcvtudq2ps ymm16, ymm15 vcvtudq2ps ymm16, [rbx] vcvtudq2ps ymm16, [rbx]{1to8} vcvtudq2ps ymm16, [rbx+r11*8+256] vcvtudq2ps ymm16, [rbx+r11*8-256] vcvtudq2ps ymm16{k5}, ymm15 vcvtudq2ps ymm16{k5}, [rbx] vcvtudq2ps ymm16{k5}, [rbx]{1to8} vcvtudq2ps ymm16{k5}, [rbx+r11*8+256] vcvtudq2ps ymm16{k5}, [rbx+r11*8-256] vcvtudq2ps ymm16{k5}{z}, ymm15 vcvtudq2ps ymm16{k5}{z}, [rbx] vcvtudq2ps ymm16{k5}{z}, [rbx]{1to8} vcvtudq2ps ymm16{k5}{z}, [rbx+r11*8+256] vcvtudq2ps ymm16{k5}{z}, [rbx+r11*8-256] vcvtudq2ps zmm24, zmm31 vcvtudq2ps zmm24, zmm31, {rd-sae} vcvtudq2ps zmm24, [rbx] vcvtudq2ps zmm24, [rbx]{1to16} vcvtudq2ps zmm24, [rbx+r11*8+256] vcvtudq2ps zmm24, [rbx+r11*8-256] vcvtudq2ps zmm24{k5}, zmm31 vcvtudq2ps zmm24{k5}, zmm31, {rd-sae} vcvtudq2ps zmm24{k5}, [rbx] vcvtudq2ps zmm24{k5}, [rbx]{1to16} vcvtudq2ps zmm24{k5}, [rbx+r11*8+256] vcvtudq2ps zmm24{k5}, [rbx+r11*8-256] vcvtudq2ps zmm24{k5}{z}, zmm31 vcvtudq2ps zmm24{k5}{z}, zmm31, {rd-sae} vcvtudq2ps zmm24{k5}{z}, [rbx] vcvtudq2ps zmm24{k5}{z}, [rbx]{1to16} vcvtudq2ps zmm24{k5}{z}, [rbx+r11*8+256] vcvtudq2ps zmm24{k5}{z}, [rbx+r11*8-256] vcvtusi2sd xmm2, xmm7, ecx vcvtusi2sd xmm2, xmm7, rcx vcvtusi2sd xmm2, xmm7, ecx vcvtusi2sd xmm2, xmm7, rcx vcvtusi2ss xmm2, xmm7, ecx vcvtusi2ss xmm2, xmm7, rcx vdivpd xmm2, xmm7, xmm0 vdivpd xmm2, xmm7, [rbx] vdivpd xmm2, xmm7, [rbx]{1to2} vdivpd xmm2, xmm7, [rbx+r11*8+256] vdivpd xmm2, xmm7, [rbx+r11*8-256] vdivpd xmm2{k5}, xmm7, xmm0 vdivpd xmm2{k5}, xmm7, [rbx] vdivpd xmm2{k5}, xmm7, [rbx]{1to2} vdivpd xmm2{k5}, xmm7, [rbx+r11*8+256] vdivpd xmm2{k5}, xmm7, [rbx+r11*8-256] vdivpd xmm2{k5}{z}, xmm7, xmm0 vdivpd xmm2{k5}{z}, xmm7, [rbx] vdivpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vdivpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vdivpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vdivpd ymm16, ymm13, ymm15 vdivpd ymm16, ymm13, [rbx] vdivpd ymm16, ymm13, [rbx]{1to4} vdivpd ymm16, ymm13, [rbx+r11*8+256] vdivpd ymm16, ymm13, [rbx+r11*8-256] vdivpd ymm16{k5}, ymm13, ymm15 vdivpd ymm16{k5}, ymm13, [rbx] vdivpd ymm16{k5}, ymm13, [rbx]{1to4} vdivpd ymm16{k5}, ymm13, [rbx+r11*8+256] vdivpd ymm16{k5}, ymm13, [rbx+r11*8-256] vdivpd ymm16{k5}{z}, ymm13, ymm15 vdivpd ymm16{k5}{z}, ymm13, [rbx] vdivpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vdivpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vdivpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vdivpd zmm24, zmm24, zmm31 vdivpd zmm24, zmm24, zmm31, {rd-sae} vdivpd zmm24, zmm24, [rbx] vdivpd zmm24, zmm24, [rbx]{1to8} vdivpd zmm24, zmm24, [rbx+r11*8+256] vdivpd zmm24, zmm24, [rbx+r11*8-256] vdivpd zmm24{k5}, zmm24, zmm31 vdivpd zmm24{k5}, zmm24, zmm31, {rd-sae} vdivpd zmm24{k5}, zmm24, [rbx] vdivpd zmm24{k5}, zmm24, [rbx]{1to8} vdivpd zmm24{k5}, zmm24, [rbx+r11*8+256] vdivpd zmm24{k5}, zmm24, [rbx+r11*8-256] vdivpd zmm24{k5}{z}, zmm24, zmm31 vdivpd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vdivpd zmm24{k5}{z}, zmm24, [rbx] vdivpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vdivpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vdivpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vdivps xmm2, xmm7, xmm0 vdivps xmm2, xmm7, [rbx] vdivps xmm2, xmm7, [rbx]{1to4} vdivps xmm2, xmm7, [rbx+r11*8+256] vdivps xmm2, xmm7, [rbx+r11*8-256] vdivps xmm2{k5}, xmm7, xmm0 vdivps xmm2{k5}, xmm7, [rbx] vdivps xmm2{k5}, xmm7, [rbx]{1to4} vdivps xmm2{k5}, xmm7, [rbx+r11*8+256] vdivps xmm2{k5}, xmm7, [rbx+r11*8-256] vdivps xmm2{k5}{z}, xmm7, xmm0 vdivps xmm2{k5}{z}, xmm7, [rbx] vdivps xmm2{k5}{z}, xmm7, [rbx]{1to4} vdivps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vdivps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vdivps ymm16, ymm13, ymm15 vdivps ymm16, ymm13, [rbx] vdivps ymm16, ymm13, [rbx]{1to8} vdivps ymm16, ymm13, [rbx+r11*8+256] vdivps ymm16, ymm13, [rbx+r11*8-256] vdivps ymm16{k5}, ymm13, ymm15 vdivps ymm16{k5}, ymm13, [rbx] vdivps ymm16{k5}, ymm13, [rbx]{1to8} vdivps ymm16{k5}, ymm13, [rbx+r11*8+256] vdivps ymm16{k5}, ymm13, [rbx+r11*8-256] vdivps ymm16{k5}{z}, ymm13, ymm15 vdivps ymm16{k5}{z}, ymm13, [rbx] vdivps ymm16{k5}{z}, ymm13, [rbx]{1to8} vdivps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vdivps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vdivps zmm24, zmm24, zmm31 vdivps zmm24, zmm24, zmm31, {rd-sae} vdivps zmm24, zmm24, [rbx] vdivps zmm24, zmm24, [rbx]{1to16} vdivps zmm24, zmm24, [rbx+r11*8+256] vdivps zmm24, zmm24, [rbx+r11*8-256] vdivps zmm24{k5}, zmm24, zmm31 vdivps zmm24{k5}, zmm24, zmm31, {rd-sae} vdivps zmm24{k5}, zmm24, [rbx] vdivps zmm24{k5}, zmm24, [rbx]{1to16} vdivps zmm24{k5}, zmm24, [rbx+r11*8+256] vdivps zmm24{k5}, zmm24, [rbx+r11*8-256] vdivps zmm24{k5}{z}, zmm24, zmm31 vdivps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vdivps zmm24{k5}{z}, zmm24, [rbx] vdivps zmm24{k5}{z}, zmm24, [rbx]{1to16} vdivps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vdivps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vdivsd xmm2, xmm7, xmm0 vdivsd xmm2, xmm7, xmm0, {rd-sae} vdivsd xmm2, xmm7, [rbx] vdivsd xmm2, xmm7, [rbx+r11*8+256] vdivsd xmm2, xmm7, [rbx+r11*8-256] vdivsd xmm2{k5}, xmm7, xmm0 vdivsd xmm2{k5}, xmm7, xmm0, {rd-sae} vdivsd xmm2{k5}, xmm7, [rbx] vdivsd xmm2{k5}, xmm7, [rbx+r11*8+256] vdivsd xmm2{k5}, xmm7, [rbx+r11*8-256] vdivsd xmm2{k5}{z}, xmm7, xmm0 vdivsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vdivsd xmm2{k5}{z}, xmm7, [rbx] vdivsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vdivsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vdivss xmm2, xmm7, xmm0 vdivss xmm2, xmm7, xmm0, {rd-sae} vdivss xmm2, xmm7, [rbx] vdivss xmm2, xmm7, [rbx+r11*8+256] vdivss xmm2, xmm7, [rbx+r11*8-256] vdivss xmm2{k5}, xmm7, xmm0 vdivss xmm2{k5}, xmm7, xmm0, {rd-sae} vdivss xmm2{k5}, xmm7, [rbx] vdivss xmm2{k5}, xmm7, [rbx+r11*8+256] vdivss xmm2{k5}, xmm7, [rbx+r11*8-256] vdivss xmm2{k5}{z}, xmm7, xmm0 vdivss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vdivss xmm2{k5}{z}, xmm7, [rbx] vdivss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vdivss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vexpandpd xmm2, xmm0 vexpandpd xmm2, [rbx] vexpandpd xmm2, [rbx+r11*8+256] vexpandpd xmm2, [rbx+r11*8-256] vexpandpd xmm2{k5}, xmm0 vexpandpd xmm2{k5}, [rbx] vexpandpd xmm2{k5}, [rbx+r11*8+256] vexpandpd xmm2{k5}, [rbx+r11*8-256] vexpandpd xmm2{k5}{z}, xmm0 vexpandpd xmm2{k5}{z}, [rbx] vexpandpd xmm2{k5}{z}, [rbx+r11*8+256] vexpandpd xmm2{k5}{z}, [rbx+r11*8-256] vexpandpd ymm16, ymm15 vexpandpd ymm16, [rbx] vexpandpd ymm16, [rbx+r11*8+256] vexpandpd ymm16, [rbx+r11*8-256] vexpandpd ymm16{k5}, ymm15 vexpandpd ymm16{k5}, [rbx] vexpandpd ymm16{k5}, [rbx+r11*8+256] vexpandpd ymm16{k5}, [rbx+r11*8-256] vexpandpd ymm16{k5}{z}, ymm15 vexpandpd ymm16{k5}{z}, [rbx] vexpandpd ymm16{k5}{z}, [rbx+r11*8+256] vexpandpd ymm16{k5}{z}, [rbx+r11*8-256] vexpandpd zmm24, zmm31 vexpandpd zmm24, [rbx] vexpandpd zmm24, [rbx+r11*8+256] vexpandpd zmm24, [rbx+r11*8-256] vexpandpd zmm24{k5}, zmm31 vexpandpd zmm24{k5}, [rbx] vexpandpd zmm24{k5}, [rbx+r11*8+256] vexpandpd zmm24{k5}, [rbx+r11*8-256] vexpandpd zmm24{k5}{z}, zmm31 vexpandpd zmm24{k5}{z}, [rbx] vexpandpd zmm24{k5}{z}, [rbx+r11*8+256] vexpandpd zmm24{k5}{z}, [rbx+r11*8-256] vexpandps xmm2, xmm0 vexpandps xmm2, [rbx] vexpandps xmm2, [rbx+r11*8+256] vexpandps xmm2, [rbx+r11*8-256] vexpandps xmm2{k5}, xmm0 vexpandps xmm2{k5}, [rbx] vexpandps xmm2{k5}, [rbx+r11*8+256] vexpandps xmm2{k5}, [rbx+r11*8-256] vexpandps xmm2{k5}{z}, xmm0 vexpandps xmm2{k5}{z}, [rbx] vexpandps xmm2{k5}{z}, [rbx+r11*8+256] vexpandps xmm2{k5}{z}, [rbx+r11*8-256] vexpandps ymm16, ymm15 vexpandps ymm16, [rbx] vexpandps ymm16, [rbx+r11*8+256] vexpandps ymm16, [rbx+r11*8-256] vexpandps ymm16{k5}, ymm15 vexpandps ymm16{k5}, [rbx] vexpandps ymm16{k5}, [rbx+r11*8+256] vexpandps ymm16{k5}, [rbx+r11*8-256] vexpandps ymm16{k5}{z}, ymm15 vexpandps ymm16{k5}{z}, [rbx] vexpandps ymm16{k5}{z}, [rbx+r11*8+256] vexpandps ymm16{k5}{z}, [rbx+r11*8-256] vexpandps zmm24, zmm31 vexpandps zmm24, [rbx] vexpandps zmm24, [rbx+r11*8+256] vexpandps zmm24, [rbx+r11*8-256] vexpandps zmm24{k5}, zmm31 vexpandps zmm24{k5}, [rbx] vexpandps zmm24{k5}, [rbx+r11*8+256] vexpandps zmm24{k5}, [rbx+r11*8-256] vexpandps zmm24{k5}{z}, zmm31 vexpandps zmm24{k5}{z}, [rbx] vexpandps zmm24{k5}{z}, [rbx+r11*8+256] vexpandps zmm24{k5}{z}, [rbx+r11*8-256] vextractf32x4 xmm0, ymm16, 10 vextractf32x4 xmm0, zmm24, 10 vextractf32x4 [rbx], ymm16, 10 vextractf32x4 [rbx], zmm24, 10 vextractf32x4 [rbx+r11*8+256], ymm16, 10 vextractf32x4 [rbx+r11*8+256], zmm24, 10 vextractf32x4 [rbx+r11*8-256], ymm16, 10 vextractf32x4 [rbx+r11*8-256], zmm24, 10 vextractf64x4 ymm15, zmm24, 10 vextractf64x4 [rbx], zmm24, 10 vextractf64x4 [rbx+r11*8+256], zmm24, 10 vextractf64x4 [rbx+r11*8-256], zmm24, 10 vextracti32x4 xmm0, ymm16, 10 vextracti32x4 xmm0, zmm24, 10 vextracti32x4 [rbx], ymm16, 10 vextracti32x4 [rbx], zmm24, 10 vextracti32x4 [rbx+r11*8+256], ymm16, 10 vextracti32x4 [rbx+r11*8+256], zmm24, 10 vextracti32x4 [rbx+r11*8-256], ymm16, 10 vextracti32x4 [rbx+r11*8-256], zmm24, 10 vextracti64x4 ymm15, zmm24, 10 vextracti64x4 [rbx], zmm24, 10 vextracti64x4 [rbx+r11*8+256], zmm24, 10 vextracti64x4 [rbx+r11*8-256], zmm24, 10 vextractps [rbx], xmm2, 10 vextractps [rbx+rsi*8+256], xmm2, 10 vextractps [rbx+rsi*8-256], xmm2, 10 vextractps ecx, xmm2, 10 vextractps rcx, xmm2, 10 vfixupimmpd xmm2, xmm7, xmm0, 10 vfixupimmpd xmm2, xmm7, [rbx], 10 vfixupimmpd xmm2, xmm7, [rbx]{1to2}, 10 vfixupimmpd xmm2, xmm7, [rbx+r11*8+256], 10 vfixupimmpd xmm2, xmm7, [rbx+r11*8-256], 10 vfixupimmpd xmm2{k5}, xmm7, xmm0, 10 vfixupimmpd xmm2{k5}, xmm7, [rbx], 10 vfixupimmpd xmm2{k5}, xmm7, [rbx]{1to2}, 10 vfixupimmpd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vfixupimmpd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vfixupimmpd xmm2{k5}{z}, xmm7, xmm0, 10 vfixupimmpd xmm2{k5}{z}, xmm7, [rbx], 10 vfixupimmpd xmm2{k5}{z}, xmm7, [rbx]{1to2}, 10 vfixupimmpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vfixupimmpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vfixupimmpd ymm16, ymm13, ymm15, 10 vfixupimmpd ymm16, ymm13, [rbx], 10 vfixupimmpd ymm16, ymm13, [rbx]{1to4}, 10 vfixupimmpd ymm16, ymm13, [rbx+r11*8+256], 10 vfixupimmpd ymm16, ymm13, [rbx+r11*8-256], 10 vfixupimmpd ymm16{k5}, ymm13, ymm15, 10 vfixupimmpd ymm16{k5}, ymm13, [rbx], 10 vfixupimmpd ymm16{k5}, ymm13, [rbx]{1to4}, 10 vfixupimmpd ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vfixupimmpd ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vfixupimmpd ymm16{k5}{z}, ymm13, ymm15, 10 vfixupimmpd ymm16{k5}{z}, ymm13, [rbx], 10 vfixupimmpd ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 vfixupimmpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vfixupimmpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vfixupimmpd zmm24, zmm24, zmm31, 10 vfixupimmpd zmm24, zmm24, [rbx], 10 vfixupimmpd zmm24, zmm24, [rbx]{1to8}, 10 vfixupimmpd zmm24, zmm24, [rbx+r11*8+256], 10 vfixupimmpd zmm24, zmm24, [rbx+r11*8-256], 10 vfixupimmpd zmm24{k5}, zmm24, zmm31, 10 vfixupimmpd zmm24{k5}, zmm24, [rbx], 10 vfixupimmpd zmm24{k5}, zmm24, [rbx]{1to8}, 10 vfixupimmpd zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vfixupimmpd zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vfixupimmpd zmm24{k5}{z}, zmm24, zmm31, 10 vfixupimmpd zmm24{k5}{z}, zmm24, [rbx], 10 vfixupimmpd zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 vfixupimmpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vfixupimmpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vfixupimmps xmm2, xmm7, xmm0, 10 vfixupimmps xmm2, xmm7, [rbx], 10 vfixupimmps xmm2, xmm7, [rbx]{1to4}, 10 vfixupimmps xmm2, xmm7, [rbx+r11*8+256], 10 vfixupimmps xmm2, xmm7, [rbx+r11*8-256], 10 vfixupimmps xmm2{k5}, xmm7, xmm0, 10 vfixupimmps xmm2{k5}, xmm7, [rbx], 10 vfixupimmps xmm2{k5}, xmm7, [rbx]{1to4}, 10 vfixupimmps xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vfixupimmps xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vfixupimmps xmm2{k5}{z}, xmm7, xmm0, 10 vfixupimmps xmm2{k5}{z}, xmm7, [rbx], 10 vfixupimmps xmm2{k5}{z}, xmm7, [rbx]{1to4}, 10 vfixupimmps xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vfixupimmps xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vfixupimmps ymm16, ymm13, ymm15, 10 vfixupimmps ymm16, ymm13, [rbx], 10 vfixupimmps ymm16, ymm13, [rbx]{1to8}, 10 vfixupimmps ymm16, ymm13, [rbx+r11*8+256], 10 vfixupimmps ymm16, ymm13, [rbx+r11*8-256], 10 vfixupimmps ymm16{k5}, ymm13, ymm15, 10 vfixupimmps ymm16{k5}, ymm13, [rbx], 10 vfixupimmps ymm16{k5}, ymm13, [rbx]{1to8}, 10 vfixupimmps ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vfixupimmps ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vfixupimmps ymm16{k5}{z}, ymm13, ymm15, 10 vfixupimmps ymm16{k5}{z}, ymm13, [rbx], 10 vfixupimmps ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 vfixupimmps ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vfixupimmps ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vfixupimmps zmm24, zmm24, zmm31, 10 vfixupimmps zmm24, zmm24, [rbx], 10 vfixupimmps zmm24, zmm24, [rbx]{1to16}, 10 vfixupimmps zmm24, zmm24, [rbx+r11*8+256], 10 vfixupimmps zmm24, zmm24, [rbx+r11*8-256], 10 vfixupimmps zmm24{k5}, zmm24, zmm31, 10 vfixupimmps zmm24{k5}, zmm24, [rbx], 10 vfixupimmps zmm24{k5}, zmm24, [rbx]{1to16}, 10 vfixupimmps zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vfixupimmps zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vfixupimmps zmm24{k5}{z}, zmm24, zmm31, 10 vfixupimmps zmm24{k5}{z}, zmm24, [rbx], 10 vfixupimmps zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 vfixupimmps zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vfixupimmps zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vfixupimmsd xmm2, xmm7, xmm0, 10 vfixupimmsd xmm2, xmm7, [rbx], 10 vfixupimmsd xmm2, xmm7, [rbx+r11*8+256], 10 vfixupimmsd xmm2, xmm7, [rbx+r11*8-256], 10 vfixupimmsd xmm2{k5}, xmm7, xmm0, 10 vfixupimmsd xmm2{k5}, xmm7, [rbx], 10 vfixupimmsd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vfixupimmsd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vfixupimmsd xmm2{k5}{z}, xmm7, xmm0, 10 vfixupimmsd xmm2{k5}{z}, xmm7, [rbx], 10 vfixupimmsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vfixupimmsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vfixupimmss xmm2, xmm7, xmm0, 10 vfixupimmss xmm2, xmm7, [rbx], 10 vfixupimmss xmm2, xmm7, [rbx+r11*8+256], 10 vfixupimmss xmm2, xmm7, [rbx+r11*8-256], 10 vfixupimmss xmm2{k5}, xmm7, xmm0, 10 vfixupimmss xmm2{k5}, xmm7, [rbx], 10 vfixupimmss xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vfixupimmss xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vfixupimmss xmm2{k5}{z}, xmm7, xmm0, 10 vfixupimmss xmm2{k5}{z}, xmm7, [rbx], 10 vfixupimmss xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vfixupimmss xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vfmadd132pd xmm2, xmm7, xmm0 vfmadd132pd xmm2, xmm7, [rbx] vfmadd132pd xmm2, xmm7, [rbx]{1to2} vfmadd132pd xmm2, xmm7, [rbx+r11*8+256] vfmadd132pd xmm2, xmm7, [rbx+r11*8-256] vfmadd132pd xmm2{k5}, xmm7, xmm0 vfmadd132pd xmm2{k5}, xmm7, [rbx] vfmadd132pd xmm2{k5}, xmm7, [rbx]{1to2} vfmadd132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd132pd xmm2{k5}{z}, xmm7, xmm0 vfmadd132pd xmm2{k5}{z}, xmm7, [rbx] vfmadd132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd132pd ymm16, ymm13, ymm15 vfmadd132pd ymm16, ymm13, [rbx] vfmadd132pd ymm16, ymm13, [rbx]{1to4} vfmadd132pd ymm16, ymm13, [rbx+r11*8+256] vfmadd132pd ymm16, ymm13, [rbx+r11*8-256] vfmadd132pd ymm16{k5}, ymm13, ymm15 vfmadd132pd ymm16{k5}, ymm13, [rbx] vfmadd132pd ymm16{k5}, ymm13, [rbx]{1to4} vfmadd132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd132pd ymm16{k5}{z}, ymm13, ymm15 vfmadd132pd ymm16{k5}{z}, ymm13, [rbx] vfmadd132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd132pd zmm24, zmm24, zmm31 vfmadd132pd zmm24, zmm24, zmm31, {rd-sae} vfmadd132pd zmm24, zmm24, [rbx] vfmadd132pd zmm24, zmm24, [rbx]{1to8} vfmadd132pd zmm24, zmm24, [rbx+r11*8+256] vfmadd132pd zmm24, zmm24, [rbx+r11*8-256] vfmadd132pd zmm24{k5}, zmm24, zmm31 vfmadd132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd132pd zmm24{k5}, zmm24, [rbx] vfmadd132pd zmm24{k5}, zmm24, [rbx]{1to8} vfmadd132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd132pd zmm24{k5}{z}, zmm24, zmm31 vfmadd132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd132pd zmm24{k5}{z}, zmm24, [rbx] vfmadd132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd132ps xmm2, xmm7, xmm0 vfmadd132ps xmm2, xmm7, [rbx] vfmadd132ps xmm2, xmm7, [rbx]{1to4} vfmadd132ps xmm2, xmm7, [rbx+r11*8+256] vfmadd132ps xmm2, xmm7, [rbx+r11*8-256] vfmadd132ps xmm2{k5}, xmm7, xmm0 vfmadd132ps xmm2{k5}, xmm7, [rbx] vfmadd132ps xmm2{k5}, xmm7, [rbx]{1to4} vfmadd132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd132ps xmm2{k5}{z}, xmm7, xmm0 vfmadd132ps xmm2{k5}{z}, xmm7, [rbx] vfmadd132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd132ps ymm16, ymm13, ymm15 vfmadd132ps ymm16, ymm13, [rbx] vfmadd132ps ymm16, ymm13, [rbx]{1to8} vfmadd132ps ymm16, ymm13, [rbx+r11*8+256] vfmadd132ps ymm16, ymm13, [rbx+r11*8-256] vfmadd132ps ymm16{k5}, ymm13, ymm15 vfmadd132ps ymm16{k5}, ymm13, [rbx] vfmadd132ps ymm16{k5}, ymm13, [rbx]{1to8} vfmadd132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd132ps ymm16{k5}{z}, ymm13, ymm15 vfmadd132ps ymm16{k5}{z}, ymm13, [rbx] vfmadd132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd132ps zmm24, zmm24, zmm31 vfmadd132ps zmm24, zmm24, zmm31, {rd-sae} vfmadd132ps zmm24, zmm24, [rbx] vfmadd132ps zmm24, zmm24, [rbx]{1to16} vfmadd132ps zmm24, zmm24, [rbx+r11*8+256] vfmadd132ps zmm24, zmm24, [rbx+r11*8-256] vfmadd132ps zmm24{k5}, zmm24, zmm31 vfmadd132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd132ps zmm24{k5}, zmm24, [rbx] vfmadd132ps zmm24{k5}, zmm24, [rbx]{1to16} vfmadd132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd132ps zmm24{k5}{z}, zmm24, zmm31 vfmadd132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd132ps zmm24{k5}{z}, zmm24, [rbx] vfmadd132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd132sd xmm2, xmm7, xmm0 vfmadd132sd xmm2, xmm7, xmm0, {rd-sae} vfmadd132sd xmm2, xmm7, [rbx] vfmadd132sd xmm2, xmm7, [rbx+r11*8+256] vfmadd132sd xmm2, xmm7, [rbx+r11*8-256] vfmadd132sd xmm2{k5}, xmm7, xmm0 vfmadd132sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd132sd xmm2{k5}, xmm7, [rbx] vfmadd132sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd132sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd132sd xmm2{k5}{z}, xmm7, xmm0 vfmadd132sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd132sd xmm2{k5}{z}, xmm7, [rbx] vfmadd132sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd132sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd132ss xmm2, xmm7, xmm0 vfmadd132ss xmm2, xmm7, xmm0, {rd-sae} vfmadd132ss xmm2, xmm7, [rbx] vfmadd132ss xmm2, xmm7, [rbx+r11*8+256] vfmadd132ss xmm2, xmm7, [rbx+r11*8-256] vfmadd132ss xmm2{k5}, xmm7, xmm0 vfmadd132ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd132ss xmm2{k5}, xmm7, [rbx] vfmadd132ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd132ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd132ss xmm2{k5}{z}, xmm7, xmm0 vfmadd132ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd132ss xmm2{k5}{z}, xmm7, [rbx] vfmadd132ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd132ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd213pd xmm2, xmm7, xmm0 vfmadd213pd xmm2, xmm7, [rbx] vfmadd213pd xmm2, xmm7, [rbx]{1to2} vfmadd213pd xmm2, xmm7, [rbx+r11*8+256] vfmadd213pd xmm2, xmm7, [rbx+r11*8-256] vfmadd213pd xmm2{k5}, xmm7, xmm0 vfmadd213pd xmm2{k5}, xmm7, [rbx] vfmadd213pd xmm2{k5}, xmm7, [rbx]{1to2} vfmadd213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd213pd xmm2{k5}{z}, xmm7, xmm0 vfmadd213pd xmm2{k5}{z}, xmm7, [rbx] vfmadd213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd213pd ymm16, ymm13, ymm15 vfmadd213pd ymm16, ymm13, [rbx] vfmadd213pd ymm16, ymm13, [rbx]{1to4} vfmadd213pd ymm16, ymm13, [rbx+r11*8+256] vfmadd213pd ymm16, ymm13, [rbx+r11*8-256] vfmadd213pd ymm16{k5}, ymm13, ymm15 vfmadd213pd ymm16{k5}, ymm13, [rbx] vfmadd213pd ymm16{k5}, ymm13, [rbx]{1to4} vfmadd213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd213pd ymm16{k5}{z}, ymm13, ymm15 vfmadd213pd ymm16{k5}{z}, ymm13, [rbx] vfmadd213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd213pd zmm24, zmm24, zmm31 vfmadd213pd zmm24, zmm24, zmm31, {rd-sae} vfmadd213pd zmm24, zmm24, [rbx] vfmadd213pd zmm24, zmm24, [rbx]{1to8} vfmadd213pd zmm24, zmm24, [rbx+r11*8+256] vfmadd213pd zmm24, zmm24, [rbx+r11*8-256] vfmadd213pd zmm24{k5}, zmm24, zmm31 vfmadd213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd213pd zmm24{k5}, zmm24, [rbx] vfmadd213pd zmm24{k5}, zmm24, [rbx]{1to8} vfmadd213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd213pd zmm24{k5}{z}, zmm24, zmm31 vfmadd213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd213pd zmm24{k5}{z}, zmm24, [rbx] vfmadd213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd213ps xmm2, xmm7, xmm0 vfmadd213ps xmm2, xmm7, [rbx] vfmadd213ps xmm2, xmm7, [rbx]{1to4} vfmadd213ps xmm2, xmm7, [rbx+r11*8+256] vfmadd213ps xmm2, xmm7, [rbx+r11*8-256] vfmadd213ps xmm2{k5}, xmm7, xmm0 vfmadd213ps xmm2{k5}, xmm7, [rbx] vfmadd213ps xmm2{k5}, xmm7, [rbx]{1to4} vfmadd213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd213ps xmm2{k5}{z}, xmm7, xmm0 vfmadd213ps xmm2{k5}{z}, xmm7, [rbx] vfmadd213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd213ps ymm16, ymm13, ymm15 vfmadd213ps ymm16, ymm13, [rbx] vfmadd213ps ymm16, ymm13, [rbx]{1to8} vfmadd213ps ymm16, ymm13, [rbx+r11*8+256] vfmadd213ps ymm16, ymm13, [rbx+r11*8-256] vfmadd213ps ymm16{k5}, ymm13, ymm15 vfmadd213ps ymm16{k5}, ymm13, [rbx] vfmadd213ps ymm16{k5}, ymm13, [rbx]{1to8} vfmadd213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd213ps ymm16{k5}{z}, ymm13, ymm15 vfmadd213ps ymm16{k5}{z}, ymm13, [rbx] vfmadd213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd213ps zmm24, zmm24, zmm31 vfmadd213ps zmm24, zmm24, zmm31, {rd-sae} vfmadd213ps zmm24, zmm24, [rbx] vfmadd213ps zmm24, zmm24, [rbx]{1to16} vfmadd213ps zmm24, zmm24, [rbx+r11*8+256] vfmadd213ps zmm24, zmm24, [rbx+r11*8-256] vfmadd213ps zmm24{k5}, zmm24, zmm31 vfmadd213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd213ps zmm24{k5}, zmm24, [rbx] vfmadd213ps zmm24{k5}, zmm24, [rbx]{1to16} vfmadd213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd213ps zmm24{k5}{z}, zmm24, zmm31 vfmadd213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd213ps zmm24{k5}{z}, zmm24, [rbx] vfmadd213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd213sd xmm2, xmm7, xmm0 vfmadd213sd xmm2, xmm7, xmm0, {rd-sae} vfmadd213sd xmm2, xmm7, [rbx] vfmadd213sd xmm2, xmm7, [rbx+r11*8+256] vfmadd213sd xmm2, xmm7, [rbx+r11*8-256] vfmadd213sd xmm2{k5}, xmm7, xmm0 vfmadd213sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd213sd xmm2{k5}, xmm7, [rbx] vfmadd213sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd213sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd213sd xmm2{k5}{z}, xmm7, xmm0 vfmadd213sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd213sd xmm2{k5}{z}, xmm7, [rbx] vfmadd213sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd213sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd213ss xmm2, xmm7, xmm0 vfmadd213ss xmm2, xmm7, xmm0, {rd-sae} vfmadd213ss xmm2, xmm7, [rbx] vfmadd213ss xmm2, xmm7, [rbx+r11*8+256] vfmadd213ss xmm2, xmm7, [rbx+r11*8-256] vfmadd213ss xmm2{k5}, xmm7, xmm0 vfmadd213ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd213ss xmm2{k5}, xmm7, [rbx] vfmadd213ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd213ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd213ss xmm2{k5}{z}, xmm7, xmm0 vfmadd213ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd213ss xmm2{k5}{z}, xmm7, [rbx] vfmadd213ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd213ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd231pd xmm2, xmm7, xmm0 vfmadd231pd xmm2, xmm7, [rbx] vfmadd231pd xmm2, xmm7, [rbx]{1to2} vfmadd231pd xmm2, xmm7, [rbx+r11*8+256] vfmadd231pd xmm2, xmm7, [rbx+r11*8-256] vfmadd231pd xmm2{k5}, xmm7, xmm0 vfmadd231pd xmm2{k5}, xmm7, [rbx] vfmadd231pd xmm2{k5}, xmm7, [rbx]{1to2} vfmadd231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd231pd xmm2{k5}{z}, xmm7, xmm0 vfmadd231pd xmm2{k5}{z}, xmm7, [rbx] vfmadd231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd231pd ymm16, ymm13, ymm15 vfmadd231pd ymm16, ymm13, [rbx] vfmadd231pd ymm16, ymm13, [rbx]{1to4} vfmadd231pd ymm16, ymm13, [rbx+r11*8+256] vfmadd231pd ymm16, ymm13, [rbx+r11*8-256] vfmadd231pd ymm16{k5}, ymm13, ymm15 vfmadd231pd ymm16{k5}, ymm13, [rbx] vfmadd231pd ymm16{k5}, ymm13, [rbx]{1to4} vfmadd231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd231pd ymm16{k5}{z}, ymm13, ymm15 vfmadd231pd ymm16{k5}{z}, ymm13, [rbx] vfmadd231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd231pd zmm24, zmm24, zmm31 vfmadd231pd zmm24, zmm24, zmm31, {rd-sae} vfmadd231pd zmm24, zmm24, [rbx] vfmadd231pd zmm24, zmm24, [rbx]{1to8} vfmadd231pd zmm24, zmm24, [rbx+r11*8+256] vfmadd231pd zmm24, zmm24, [rbx+r11*8-256] vfmadd231pd zmm24{k5}, zmm24, zmm31 vfmadd231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd231pd zmm24{k5}, zmm24, [rbx] vfmadd231pd zmm24{k5}, zmm24, [rbx]{1to8} vfmadd231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd231pd zmm24{k5}{z}, zmm24, zmm31 vfmadd231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd231pd zmm24{k5}{z}, zmm24, [rbx] vfmadd231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd231ps xmm2, xmm7, xmm0 vfmadd231ps xmm2, xmm7, [rbx] vfmadd231ps xmm2, xmm7, [rbx]{1to4} vfmadd231ps xmm2, xmm7, [rbx+r11*8+256] vfmadd231ps xmm2, xmm7, [rbx+r11*8-256] vfmadd231ps xmm2{k5}, xmm7, xmm0 vfmadd231ps xmm2{k5}, xmm7, [rbx] vfmadd231ps xmm2{k5}, xmm7, [rbx]{1to4} vfmadd231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd231ps xmm2{k5}{z}, xmm7, xmm0 vfmadd231ps xmm2{k5}{z}, xmm7, [rbx] vfmadd231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd231ps ymm16, ymm13, ymm15 vfmadd231ps ymm16, ymm13, [rbx] vfmadd231ps ymm16, ymm13, [rbx]{1to8} vfmadd231ps ymm16, ymm13, [rbx+r11*8+256] vfmadd231ps ymm16, ymm13, [rbx+r11*8-256] vfmadd231ps ymm16{k5}, ymm13, ymm15 vfmadd231ps ymm16{k5}, ymm13, [rbx] vfmadd231ps ymm16{k5}, ymm13, [rbx]{1to8} vfmadd231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmadd231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmadd231ps ymm16{k5}{z}, ymm13, ymm15 vfmadd231ps ymm16{k5}{z}, ymm13, [rbx] vfmadd231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmadd231ps zmm24, zmm24, zmm31 vfmadd231ps zmm24, zmm24, zmm31, {rd-sae} vfmadd231ps zmm24, zmm24, [rbx] vfmadd231ps zmm24, zmm24, [rbx]{1to16} vfmadd231ps zmm24, zmm24, [rbx+r11*8+256] vfmadd231ps zmm24, zmm24, [rbx+r11*8-256] vfmadd231ps zmm24{k5}, zmm24, zmm31 vfmadd231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmadd231ps zmm24{k5}, zmm24, [rbx] vfmadd231ps zmm24{k5}, zmm24, [rbx]{1to16} vfmadd231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmadd231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmadd231ps zmm24{k5}{z}, zmm24, zmm31 vfmadd231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmadd231ps zmm24{k5}{z}, zmm24, [rbx] vfmadd231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmadd231sd xmm2, xmm7, xmm0 vfmadd231sd xmm2, xmm7, xmm0, {rd-sae} vfmadd231sd xmm2, xmm7, [rbx] vfmadd231sd xmm2, xmm7, [rbx+r11*8+256] vfmadd231sd xmm2, xmm7, [rbx+r11*8-256] vfmadd231sd xmm2{k5}, xmm7, xmm0 vfmadd231sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd231sd xmm2{k5}, xmm7, [rbx] vfmadd231sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd231sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd231sd xmm2{k5}{z}, xmm7, xmm0 vfmadd231sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd231sd xmm2{k5}{z}, xmm7, [rbx] vfmadd231sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd231sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmadd231ss xmm2, xmm7, xmm0 vfmadd231ss xmm2, xmm7, xmm0, {rd-sae} vfmadd231ss xmm2, xmm7, [rbx] vfmadd231ss xmm2, xmm7, [rbx+r11*8+256] vfmadd231ss xmm2, xmm7, [rbx+r11*8-256] vfmadd231ss xmm2{k5}, xmm7, xmm0 vfmadd231ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmadd231ss xmm2{k5}, xmm7, [rbx] vfmadd231ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmadd231ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmadd231ss xmm2{k5}{z}, xmm7, xmm0 vfmadd231ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmadd231ss xmm2{k5}{z}, xmm7, [rbx] vfmadd231ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmadd231ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub132pd xmm2, xmm7, xmm0 vfmaddsub132pd xmm2, xmm7, [rbx] vfmaddsub132pd xmm2, xmm7, [rbx]{1to2} vfmaddsub132pd xmm2, xmm7, [rbx+r11*8+256] vfmaddsub132pd xmm2, xmm7, [rbx+r11*8-256] vfmaddsub132pd xmm2{k5}, xmm7, xmm0 vfmaddsub132pd xmm2{k5}, xmm7, [rbx] vfmaddsub132pd xmm2{k5}, xmm7, [rbx]{1to2} vfmaddsub132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub132pd xmm2{k5}{z}, xmm7, xmm0 vfmaddsub132pd xmm2{k5}{z}, xmm7, [rbx] vfmaddsub132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmaddsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub132pd ymm16, ymm13, ymm15 vfmaddsub132pd ymm16, ymm13, [rbx] vfmaddsub132pd ymm16, ymm13, [rbx]{1to4} vfmaddsub132pd ymm16, ymm13, [rbx+r11*8+256] vfmaddsub132pd ymm16, ymm13, [rbx+r11*8-256] vfmaddsub132pd ymm16{k5}, ymm13, ymm15 vfmaddsub132pd ymm16{k5}, ymm13, [rbx] vfmaddsub132pd ymm16{k5}, ymm13, [rbx]{1to4} vfmaddsub132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub132pd ymm16{k5}{z}, ymm13, ymm15 vfmaddsub132pd ymm16{k5}{z}, ymm13, [rbx] vfmaddsub132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmaddsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub132pd zmm24, zmm24, zmm31 vfmaddsub132pd zmm24, zmm24, zmm31, {rd-sae} vfmaddsub132pd zmm24, zmm24, [rbx] vfmaddsub132pd zmm24, zmm24, [rbx]{1to8} vfmaddsub132pd zmm24, zmm24, [rbx+r11*8+256] vfmaddsub132pd zmm24, zmm24, [rbx+r11*8-256] vfmaddsub132pd zmm24{k5}, zmm24, zmm31 vfmaddsub132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub132pd zmm24{k5}, zmm24, [rbx] vfmaddsub132pd zmm24{k5}, zmm24, [rbx]{1to8} vfmaddsub132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub132pd zmm24{k5}{z}, zmm24, zmm31 vfmaddsub132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub132pd zmm24{k5}{z}, zmm24, [rbx] vfmaddsub132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmaddsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmaddsub132ps xmm2, xmm7, xmm0 vfmaddsub132ps xmm2, xmm7, [rbx] vfmaddsub132ps xmm2, xmm7, [rbx]{1to4} vfmaddsub132ps xmm2, xmm7, [rbx+r11*8+256] vfmaddsub132ps xmm2, xmm7, [rbx+r11*8-256] vfmaddsub132ps xmm2{k5}, xmm7, xmm0 vfmaddsub132ps xmm2{k5}, xmm7, [rbx] vfmaddsub132ps xmm2{k5}, xmm7, [rbx]{1to4} vfmaddsub132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub132ps xmm2{k5}{z}, xmm7, xmm0 vfmaddsub132ps xmm2{k5}{z}, xmm7, [rbx] vfmaddsub132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmaddsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub132ps ymm16, ymm13, ymm15 vfmaddsub132ps ymm16, ymm13, [rbx] vfmaddsub132ps ymm16, ymm13, [rbx]{1to8} vfmaddsub132ps ymm16, ymm13, [rbx+r11*8+256] vfmaddsub132ps ymm16, ymm13, [rbx+r11*8-256] vfmaddsub132ps ymm16{k5}, ymm13, ymm15 vfmaddsub132ps ymm16{k5}, ymm13, [rbx] vfmaddsub132ps ymm16{k5}, ymm13, [rbx]{1to8} vfmaddsub132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub132ps ymm16{k5}{z}, ymm13, ymm15 vfmaddsub132ps ymm16{k5}{z}, ymm13, [rbx] vfmaddsub132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmaddsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub132ps zmm24, zmm24, zmm31 vfmaddsub132ps zmm24, zmm24, zmm31, {rd-sae} vfmaddsub132ps zmm24, zmm24, [rbx] vfmaddsub132ps zmm24, zmm24, [rbx]{1to16} vfmaddsub132ps zmm24, zmm24, [rbx+r11*8+256] vfmaddsub132ps zmm24, zmm24, [rbx+r11*8-256] vfmaddsub132ps zmm24{k5}, zmm24, zmm31 vfmaddsub132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub132ps zmm24{k5}, zmm24, [rbx] vfmaddsub132ps zmm24{k5}, zmm24, [rbx]{1to16} vfmaddsub132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub132ps zmm24{k5}{z}, zmm24, zmm31 vfmaddsub132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub132ps zmm24{k5}{z}, zmm24, [rbx] vfmaddsub132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmaddsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmaddsub213pd xmm2, xmm7, xmm0 vfmaddsub213pd xmm2, xmm7, [rbx] vfmaddsub213pd xmm2, xmm7, [rbx]{1to2} vfmaddsub213pd xmm2, xmm7, [rbx+r11*8+256] vfmaddsub213pd xmm2, xmm7, [rbx+r11*8-256] vfmaddsub213pd xmm2{k5}, xmm7, xmm0 vfmaddsub213pd xmm2{k5}, xmm7, [rbx] vfmaddsub213pd xmm2{k5}, xmm7, [rbx]{1to2} vfmaddsub213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub213pd xmm2{k5}{z}, xmm7, xmm0 vfmaddsub213pd xmm2{k5}{z}, xmm7, [rbx] vfmaddsub213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmaddsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub213pd ymm16, ymm13, ymm15 vfmaddsub213pd ymm16, ymm13, [rbx] vfmaddsub213pd ymm16, ymm13, [rbx]{1to4} vfmaddsub213pd ymm16, ymm13, [rbx+r11*8+256] vfmaddsub213pd ymm16, ymm13, [rbx+r11*8-256] vfmaddsub213pd ymm16{k5}, ymm13, ymm15 vfmaddsub213pd ymm16{k5}, ymm13, [rbx] vfmaddsub213pd ymm16{k5}, ymm13, [rbx]{1to4} vfmaddsub213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub213pd ymm16{k5}{z}, ymm13, ymm15 vfmaddsub213pd ymm16{k5}{z}, ymm13, [rbx] vfmaddsub213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmaddsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub213pd zmm24, zmm24, zmm31 vfmaddsub213pd zmm24, zmm24, zmm31, {rd-sae} vfmaddsub213pd zmm24, zmm24, [rbx] vfmaddsub213pd zmm24, zmm24, [rbx]{1to8} vfmaddsub213pd zmm24, zmm24, [rbx+r11*8+256] vfmaddsub213pd zmm24, zmm24, [rbx+r11*8-256] vfmaddsub213pd zmm24{k5}, zmm24, zmm31 vfmaddsub213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub213pd zmm24{k5}, zmm24, [rbx] vfmaddsub213pd zmm24{k5}, zmm24, [rbx]{1to8} vfmaddsub213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub213pd zmm24{k5}{z}, zmm24, zmm31 vfmaddsub213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub213pd zmm24{k5}{z}, zmm24, [rbx] vfmaddsub213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmaddsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmaddsub213ps xmm2, xmm7, xmm0 vfmaddsub213ps xmm2, xmm7, [rbx] vfmaddsub213ps xmm2, xmm7, [rbx]{1to4} vfmaddsub213ps xmm2, xmm7, [rbx+r11*8+256] vfmaddsub213ps xmm2, xmm7, [rbx+r11*8-256] vfmaddsub213ps xmm2{k5}, xmm7, xmm0 vfmaddsub213ps xmm2{k5}, xmm7, [rbx] vfmaddsub213ps xmm2{k5}, xmm7, [rbx]{1to4} vfmaddsub213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub213ps xmm2{k5}{z}, xmm7, xmm0 vfmaddsub213ps xmm2{k5}{z}, xmm7, [rbx] vfmaddsub213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmaddsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub213ps ymm16, ymm13, ymm15 vfmaddsub213ps ymm16, ymm13, [rbx] vfmaddsub213ps ymm16, ymm13, [rbx]{1to8} vfmaddsub213ps ymm16, ymm13, [rbx+r11*8+256] vfmaddsub213ps ymm16, ymm13, [rbx+r11*8-256] vfmaddsub213ps ymm16{k5}, ymm13, ymm15 vfmaddsub213ps ymm16{k5}, ymm13, [rbx] vfmaddsub213ps ymm16{k5}, ymm13, [rbx]{1to8} vfmaddsub213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub213ps ymm16{k5}{z}, ymm13, ymm15 vfmaddsub213ps ymm16{k5}{z}, ymm13, [rbx] vfmaddsub213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmaddsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub213ps zmm24, zmm24, zmm31 vfmaddsub213ps zmm24, zmm24, zmm31, {rd-sae} vfmaddsub213ps zmm24, zmm24, [rbx] vfmaddsub213ps zmm24, zmm24, [rbx]{1to16} vfmaddsub213ps zmm24, zmm24, [rbx+r11*8+256] vfmaddsub213ps zmm24, zmm24, [rbx+r11*8-256] vfmaddsub213ps zmm24{k5}, zmm24, zmm31 vfmaddsub213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub213ps zmm24{k5}, zmm24, [rbx] vfmaddsub213ps zmm24{k5}, zmm24, [rbx]{1to16} vfmaddsub213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub213ps zmm24{k5}{z}, zmm24, zmm31 vfmaddsub213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub213ps zmm24{k5}{z}, zmm24, [rbx] vfmaddsub213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmaddsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmaddsub231pd xmm2, xmm7, xmm0 vfmaddsub231pd xmm2, xmm7, [rbx] vfmaddsub231pd xmm2, xmm7, [rbx]{1to2} vfmaddsub231pd xmm2, xmm7, [rbx+r11*8+256] vfmaddsub231pd xmm2, xmm7, [rbx+r11*8-256] vfmaddsub231pd xmm2{k5}, xmm7, xmm0 vfmaddsub231pd xmm2{k5}, xmm7, [rbx] vfmaddsub231pd xmm2{k5}, xmm7, [rbx]{1to2} vfmaddsub231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub231pd xmm2{k5}{z}, xmm7, xmm0 vfmaddsub231pd xmm2{k5}{z}, xmm7, [rbx] vfmaddsub231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmaddsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub231pd ymm16, ymm13, ymm15 vfmaddsub231pd ymm16, ymm13, [rbx] vfmaddsub231pd ymm16, ymm13, [rbx]{1to4} vfmaddsub231pd ymm16, ymm13, [rbx+r11*8+256] vfmaddsub231pd ymm16, ymm13, [rbx+r11*8-256] vfmaddsub231pd ymm16{k5}, ymm13, ymm15 vfmaddsub231pd ymm16{k5}, ymm13, [rbx] vfmaddsub231pd ymm16{k5}, ymm13, [rbx]{1to4} vfmaddsub231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub231pd ymm16{k5}{z}, ymm13, ymm15 vfmaddsub231pd ymm16{k5}{z}, ymm13, [rbx] vfmaddsub231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmaddsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub231pd zmm24, zmm24, zmm31 vfmaddsub231pd zmm24, zmm24, zmm31, {rd-sae} vfmaddsub231pd zmm24, zmm24, [rbx] vfmaddsub231pd zmm24, zmm24, [rbx]{1to8} vfmaddsub231pd zmm24, zmm24, [rbx+r11*8+256] vfmaddsub231pd zmm24, zmm24, [rbx+r11*8-256] vfmaddsub231pd zmm24{k5}, zmm24, zmm31 vfmaddsub231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub231pd zmm24{k5}, zmm24, [rbx] vfmaddsub231pd zmm24{k5}, zmm24, [rbx]{1to8} vfmaddsub231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub231pd zmm24{k5}{z}, zmm24, zmm31 vfmaddsub231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub231pd zmm24{k5}{z}, zmm24, [rbx] vfmaddsub231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmaddsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmaddsub231ps xmm2, xmm7, xmm0 vfmaddsub231ps xmm2, xmm7, [rbx] vfmaddsub231ps xmm2, xmm7, [rbx]{1to4} vfmaddsub231ps xmm2, xmm7, [rbx+r11*8+256] vfmaddsub231ps xmm2, xmm7, [rbx+r11*8-256] vfmaddsub231ps xmm2{k5}, xmm7, xmm0 vfmaddsub231ps xmm2{k5}, xmm7, [rbx] vfmaddsub231ps xmm2{k5}, xmm7, [rbx]{1to4} vfmaddsub231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmaddsub231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmaddsub231ps xmm2{k5}{z}, xmm7, xmm0 vfmaddsub231ps xmm2{k5}{z}, xmm7, [rbx] vfmaddsub231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmaddsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmaddsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmaddsub231ps ymm16, ymm13, ymm15 vfmaddsub231ps ymm16, ymm13, [rbx] vfmaddsub231ps ymm16, ymm13, [rbx]{1to8} vfmaddsub231ps ymm16, ymm13, [rbx+r11*8+256] vfmaddsub231ps ymm16, ymm13, [rbx+r11*8-256] vfmaddsub231ps ymm16{k5}, ymm13, ymm15 vfmaddsub231ps ymm16{k5}, ymm13, [rbx] vfmaddsub231ps ymm16{k5}, ymm13, [rbx]{1to8} vfmaddsub231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmaddsub231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmaddsub231ps ymm16{k5}{z}, ymm13, ymm15 vfmaddsub231ps ymm16{k5}{z}, ymm13, [rbx] vfmaddsub231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmaddsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmaddsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmaddsub231ps zmm24, zmm24, zmm31 vfmaddsub231ps zmm24, zmm24, zmm31, {rd-sae} vfmaddsub231ps zmm24, zmm24, [rbx] vfmaddsub231ps zmm24, zmm24, [rbx]{1to16} vfmaddsub231ps zmm24, zmm24, [rbx+r11*8+256] vfmaddsub231ps zmm24, zmm24, [rbx+r11*8-256] vfmaddsub231ps zmm24{k5}, zmm24, zmm31 vfmaddsub231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmaddsub231ps zmm24{k5}, zmm24, [rbx] vfmaddsub231ps zmm24{k5}, zmm24, [rbx]{1to16} vfmaddsub231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmaddsub231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmaddsub231ps zmm24{k5}{z}, zmm24, zmm31 vfmaddsub231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmaddsub231ps zmm24{k5}{z}, zmm24, [rbx] vfmaddsub231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmaddsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmaddsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub132pd xmm2, xmm7, xmm0 vfmsub132pd xmm2, xmm7, [rbx] vfmsub132pd xmm2, xmm7, [rbx]{1to2} vfmsub132pd xmm2, xmm7, [rbx+r11*8+256] vfmsub132pd xmm2, xmm7, [rbx+r11*8-256] vfmsub132pd xmm2{k5}, xmm7, xmm0 vfmsub132pd xmm2{k5}, xmm7, [rbx] vfmsub132pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsub132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub132pd xmm2{k5}{z}, xmm7, xmm0 vfmsub132pd xmm2{k5}{z}, xmm7, [rbx] vfmsub132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub132pd ymm16, ymm13, ymm15 vfmsub132pd ymm16, ymm13, [rbx] vfmsub132pd ymm16, ymm13, [rbx]{1to4} vfmsub132pd ymm16, ymm13, [rbx+r11*8+256] vfmsub132pd ymm16, ymm13, [rbx+r11*8-256] vfmsub132pd ymm16{k5}, ymm13, ymm15 vfmsub132pd ymm16{k5}, ymm13, [rbx] vfmsub132pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsub132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub132pd ymm16{k5}{z}, ymm13, ymm15 vfmsub132pd ymm16{k5}{z}, ymm13, [rbx] vfmsub132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub132pd zmm24, zmm24, zmm31 vfmsub132pd zmm24, zmm24, zmm31, {rd-sae} vfmsub132pd zmm24, zmm24, [rbx] vfmsub132pd zmm24, zmm24, [rbx]{1to8} vfmsub132pd zmm24, zmm24, [rbx+r11*8+256] vfmsub132pd zmm24, zmm24, [rbx+r11*8-256] vfmsub132pd zmm24{k5}, zmm24, zmm31 vfmsub132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub132pd zmm24{k5}, zmm24, [rbx] vfmsub132pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsub132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub132pd zmm24{k5}{z}, zmm24, zmm31 vfmsub132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub132pd zmm24{k5}{z}, zmm24, [rbx] vfmsub132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub132ps xmm2, xmm7, xmm0 vfmsub132ps xmm2, xmm7, [rbx] vfmsub132ps xmm2, xmm7, [rbx]{1to4} vfmsub132ps xmm2, xmm7, [rbx+r11*8+256] vfmsub132ps xmm2, xmm7, [rbx+r11*8-256] vfmsub132ps xmm2{k5}, xmm7, xmm0 vfmsub132ps xmm2{k5}, xmm7, [rbx] vfmsub132ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsub132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub132ps xmm2{k5}{z}, xmm7, xmm0 vfmsub132ps xmm2{k5}{z}, xmm7, [rbx] vfmsub132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub132ps ymm16, ymm13, ymm15 vfmsub132ps ymm16, ymm13, [rbx] vfmsub132ps ymm16, ymm13, [rbx]{1to8} vfmsub132ps ymm16, ymm13, [rbx+r11*8+256] vfmsub132ps ymm16, ymm13, [rbx+r11*8-256] vfmsub132ps ymm16{k5}, ymm13, ymm15 vfmsub132ps ymm16{k5}, ymm13, [rbx] vfmsub132ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsub132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub132ps ymm16{k5}{z}, ymm13, ymm15 vfmsub132ps ymm16{k5}{z}, ymm13, [rbx] vfmsub132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub132ps zmm24, zmm24, zmm31 vfmsub132ps zmm24, zmm24, zmm31, {rd-sae} vfmsub132ps zmm24, zmm24, [rbx] vfmsub132ps zmm24, zmm24, [rbx]{1to16} vfmsub132ps zmm24, zmm24, [rbx+r11*8+256] vfmsub132ps zmm24, zmm24, [rbx+r11*8-256] vfmsub132ps zmm24{k5}, zmm24, zmm31 vfmsub132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub132ps zmm24{k5}, zmm24, [rbx] vfmsub132ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsub132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub132ps zmm24{k5}{z}, zmm24, zmm31 vfmsub132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub132ps zmm24{k5}{z}, zmm24, [rbx] vfmsub132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub132sd xmm2, xmm7, xmm0 vfmsub132sd xmm2, xmm7, xmm0, {rd-sae} vfmsub132sd xmm2, xmm7, [rbx] vfmsub132sd xmm2, xmm7, [rbx+r11*8+256] vfmsub132sd xmm2, xmm7, [rbx+r11*8-256] vfmsub132sd xmm2{k5}, xmm7, xmm0 vfmsub132sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub132sd xmm2{k5}, xmm7, [rbx] vfmsub132sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub132sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub132sd xmm2{k5}{z}, xmm7, xmm0 vfmsub132sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub132sd xmm2{k5}{z}, xmm7, [rbx] vfmsub132sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub132sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub132ss xmm2, xmm7, xmm0 vfmsub132ss xmm2, xmm7, xmm0, {rd-sae} vfmsub132ss xmm2, xmm7, [rbx] vfmsub132ss xmm2, xmm7, [rbx+r11*8+256] vfmsub132ss xmm2, xmm7, [rbx+r11*8-256] vfmsub132ss xmm2{k5}, xmm7, xmm0 vfmsub132ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub132ss xmm2{k5}, xmm7, [rbx] vfmsub132ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub132ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub132ss xmm2{k5}{z}, xmm7, xmm0 vfmsub132ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub132ss xmm2{k5}{z}, xmm7, [rbx] vfmsub132ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub132ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub213pd xmm2, xmm7, xmm0 vfmsub213pd xmm2, xmm7, [rbx] vfmsub213pd xmm2, xmm7, [rbx]{1to2} vfmsub213pd xmm2, xmm7, [rbx+r11*8+256] vfmsub213pd xmm2, xmm7, [rbx+r11*8-256] vfmsub213pd xmm2{k5}, xmm7, xmm0 vfmsub213pd xmm2{k5}, xmm7, [rbx] vfmsub213pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsub213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub213pd xmm2{k5}{z}, xmm7, xmm0 vfmsub213pd xmm2{k5}{z}, xmm7, [rbx] vfmsub213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub213pd ymm16, ymm13, ymm15 vfmsub213pd ymm16, ymm13, [rbx] vfmsub213pd ymm16, ymm13, [rbx]{1to4} vfmsub213pd ymm16, ymm13, [rbx+r11*8+256] vfmsub213pd ymm16, ymm13, [rbx+r11*8-256] vfmsub213pd ymm16{k5}, ymm13, ymm15 vfmsub213pd ymm16{k5}, ymm13, [rbx] vfmsub213pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsub213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub213pd ymm16{k5}{z}, ymm13, ymm15 vfmsub213pd ymm16{k5}{z}, ymm13, [rbx] vfmsub213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub213pd zmm24, zmm24, zmm31 vfmsub213pd zmm24, zmm24, zmm31, {rd-sae} vfmsub213pd zmm24, zmm24, [rbx] vfmsub213pd zmm24, zmm24, [rbx]{1to8} vfmsub213pd zmm24, zmm24, [rbx+r11*8+256] vfmsub213pd zmm24, zmm24, [rbx+r11*8-256] vfmsub213pd zmm24{k5}, zmm24, zmm31 vfmsub213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub213pd zmm24{k5}, zmm24, [rbx] vfmsub213pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsub213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub213pd zmm24{k5}{z}, zmm24, zmm31 vfmsub213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub213pd zmm24{k5}{z}, zmm24, [rbx] vfmsub213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub213ps xmm2, xmm7, xmm0 vfmsub213ps xmm2, xmm7, [rbx] vfmsub213ps xmm2, xmm7, [rbx]{1to4} vfmsub213ps xmm2, xmm7, [rbx+r11*8+256] vfmsub213ps xmm2, xmm7, [rbx+r11*8-256] vfmsub213ps xmm2{k5}, xmm7, xmm0 vfmsub213ps xmm2{k5}, xmm7, [rbx] vfmsub213ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsub213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub213ps xmm2{k5}{z}, xmm7, xmm0 vfmsub213ps xmm2{k5}{z}, xmm7, [rbx] vfmsub213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub213ps ymm16, ymm13, ymm15 vfmsub213ps ymm16, ymm13, [rbx] vfmsub213ps ymm16, ymm13, [rbx]{1to8} vfmsub213ps ymm16, ymm13, [rbx+r11*8+256] vfmsub213ps ymm16, ymm13, [rbx+r11*8-256] vfmsub213ps ymm16{k5}, ymm13, ymm15 vfmsub213ps ymm16{k5}, ymm13, [rbx] vfmsub213ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsub213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub213ps ymm16{k5}{z}, ymm13, ymm15 vfmsub213ps ymm16{k5}{z}, ymm13, [rbx] vfmsub213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub213ps zmm24, zmm24, zmm31 vfmsub213ps zmm24, zmm24, zmm31, {rd-sae} vfmsub213ps zmm24, zmm24, [rbx] vfmsub213ps zmm24, zmm24, [rbx]{1to16} vfmsub213ps zmm24, zmm24, [rbx+r11*8+256] vfmsub213ps zmm24, zmm24, [rbx+r11*8-256] vfmsub213ps zmm24{k5}, zmm24, zmm31 vfmsub213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub213ps zmm24{k5}, zmm24, [rbx] vfmsub213ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsub213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub213ps zmm24{k5}{z}, zmm24, zmm31 vfmsub213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub213ps zmm24{k5}{z}, zmm24, [rbx] vfmsub213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub213sd xmm2, xmm7, xmm0 vfmsub213sd xmm2, xmm7, xmm0, {rd-sae} vfmsub213sd xmm2, xmm7, [rbx] vfmsub213sd xmm2, xmm7, [rbx+r11*8+256] vfmsub213sd xmm2, xmm7, [rbx+r11*8-256] vfmsub213sd xmm2{k5}, xmm7, xmm0 vfmsub213sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub213sd xmm2{k5}, xmm7, [rbx] vfmsub213sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub213sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub213sd xmm2{k5}{z}, xmm7, xmm0 vfmsub213sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub213sd xmm2{k5}{z}, xmm7, [rbx] vfmsub213sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub213sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub213ss xmm2, xmm7, xmm0 vfmsub213ss xmm2, xmm7, xmm0, {rd-sae} vfmsub213ss xmm2, xmm7, [rbx] vfmsub213ss xmm2, xmm7, [rbx+r11*8+256] vfmsub213ss xmm2, xmm7, [rbx+r11*8-256] vfmsub213ss xmm2{k5}, xmm7, xmm0 vfmsub213ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub213ss xmm2{k5}, xmm7, [rbx] vfmsub213ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub213ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub213ss xmm2{k5}{z}, xmm7, xmm0 vfmsub213ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub213ss xmm2{k5}{z}, xmm7, [rbx] vfmsub213ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub213ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub231pd xmm2, xmm7, xmm0 vfmsub231pd xmm2, xmm7, [rbx] vfmsub231pd xmm2, xmm7, [rbx]{1to2} vfmsub231pd xmm2, xmm7, [rbx+r11*8+256] vfmsub231pd xmm2, xmm7, [rbx+r11*8-256] vfmsub231pd xmm2{k5}, xmm7, xmm0 vfmsub231pd xmm2{k5}, xmm7, [rbx] vfmsub231pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsub231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub231pd xmm2{k5}{z}, xmm7, xmm0 vfmsub231pd xmm2{k5}{z}, xmm7, [rbx] vfmsub231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub231pd ymm16, ymm13, ymm15 vfmsub231pd ymm16, ymm13, [rbx] vfmsub231pd ymm16, ymm13, [rbx]{1to4} vfmsub231pd ymm16, ymm13, [rbx+r11*8+256] vfmsub231pd ymm16, ymm13, [rbx+r11*8-256] vfmsub231pd ymm16{k5}, ymm13, ymm15 vfmsub231pd ymm16{k5}, ymm13, [rbx] vfmsub231pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsub231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub231pd ymm16{k5}{z}, ymm13, ymm15 vfmsub231pd ymm16{k5}{z}, ymm13, [rbx] vfmsub231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub231pd zmm24, zmm24, zmm31 vfmsub231pd zmm24, zmm24, zmm31, {rd-sae} vfmsub231pd zmm24, zmm24, [rbx] vfmsub231pd zmm24, zmm24, [rbx]{1to8} vfmsub231pd zmm24, zmm24, [rbx+r11*8+256] vfmsub231pd zmm24, zmm24, [rbx+r11*8-256] vfmsub231pd zmm24{k5}, zmm24, zmm31 vfmsub231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub231pd zmm24{k5}, zmm24, [rbx] vfmsub231pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsub231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub231pd zmm24{k5}{z}, zmm24, zmm31 vfmsub231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub231pd zmm24{k5}{z}, zmm24, [rbx] vfmsub231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub231ps xmm2, xmm7, xmm0 vfmsub231ps xmm2, xmm7, [rbx] vfmsub231ps xmm2, xmm7, [rbx]{1to4} vfmsub231ps xmm2, xmm7, [rbx+r11*8+256] vfmsub231ps xmm2, xmm7, [rbx+r11*8-256] vfmsub231ps xmm2{k5}, xmm7, xmm0 vfmsub231ps xmm2{k5}, xmm7, [rbx] vfmsub231ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsub231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub231ps xmm2{k5}{z}, xmm7, xmm0 vfmsub231ps xmm2{k5}{z}, xmm7, [rbx] vfmsub231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub231ps ymm16, ymm13, ymm15 vfmsub231ps ymm16, ymm13, [rbx] vfmsub231ps ymm16, ymm13, [rbx]{1to8} vfmsub231ps ymm16, ymm13, [rbx+r11*8+256] vfmsub231ps ymm16, ymm13, [rbx+r11*8-256] vfmsub231ps ymm16{k5}, ymm13, ymm15 vfmsub231ps ymm16{k5}, ymm13, [rbx] vfmsub231ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsub231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsub231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsub231ps ymm16{k5}{z}, ymm13, ymm15 vfmsub231ps ymm16{k5}{z}, ymm13, [rbx] vfmsub231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsub231ps zmm24, zmm24, zmm31 vfmsub231ps zmm24, zmm24, zmm31, {rd-sae} vfmsub231ps zmm24, zmm24, [rbx] vfmsub231ps zmm24, zmm24, [rbx]{1to16} vfmsub231ps zmm24, zmm24, [rbx+r11*8+256] vfmsub231ps zmm24, zmm24, [rbx+r11*8-256] vfmsub231ps zmm24{k5}, zmm24, zmm31 vfmsub231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsub231ps zmm24{k5}, zmm24, [rbx] vfmsub231ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsub231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsub231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsub231ps zmm24{k5}{z}, zmm24, zmm31 vfmsub231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsub231ps zmm24{k5}{z}, zmm24, [rbx] vfmsub231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsub231sd xmm2, xmm7, xmm0 vfmsub231sd xmm2, xmm7, xmm0, {rd-sae} vfmsub231sd xmm2, xmm7, [rbx] vfmsub231sd xmm2, xmm7, [rbx+r11*8+256] vfmsub231sd xmm2, xmm7, [rbx+r11*8-256] vfmsub231sd xmm2{k5}, xmm7, xmm0 vfmsub231sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub231sd xmm2{k5}, xmm7, [rbx] vfmsub231sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub231sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub231sd xmm2{k5}{z}, xmm7, xmm0 vfmsub231sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub231sd xmm2{k5}{z}, xmm7, [rbx] vfmsub231sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub231sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsub231ss xmm2, xmm7, xmm0 vfmsub231ss xmm2, xmm7, xmm0, {rd-sae} vfmsub231ss xmm2, xmm7, [rbx] vfmsub231ss xmm2, xmm7, [rbx+r11*8+256] vfmsub231ss xmm2, xmm7, [rbx+r11*8-256] vfmsub231ss xmm2{k5}, xmm7, xmm0 vfmsub231ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfmsub231ss xmm2{k5}, xmm7, [rbx] vfmsub231ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsub231ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsub231ss xmm2{k5}{z}, xmm7, xmm0 vfmsub231ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfmsub231ss xmm2{k5}{z}, xmm7, [rbx] vfmsub231ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsub231ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd132pd xmm2, xmm7, xmm0 vfmsubadd132pd xmm2, xmm7, [rbx] vfmsubadd132pd xmm2, xmm7, [rbx]{1to2} vfmsubadd132pd xmm2, xmm7, [rbx+r11*8+256] vfmsubadd132pd xmm2, xmm7, [rbx+r11*8-256] vfmsubadd132pd xmm2{k5}, xmm7, xmm0 vfmsubadd132pd xmm2{k5}, xmm7, [rbx] vfmsubadd132pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsubadd132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd132pd xmm2{k5}{z}, xmm7, xmm0 vfmsubadd132pd xmm2{k5}{z}, xmm7, [rbx] vfmsubadd132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsubadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd132pd ymm16, ymm13, ymm15 vfmsubadd132pd ymm16, ymm13, [rbx] vfmsubadd132pd ymm16, ymm13, [rbx]{1to4} vfmsubadd132pd ymm16, ymm13, [rbx+r11*8+256] vfmsubadd132pd ymm16, ymm13, [rbx+r11*8-256] vfmsubadd132pd ymm16{k5}, ymm13, ymm15 vfmsubadd132pd ymm16{k5}, ymm13, [rbx] vfmsubadd132pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsubadd132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd132pd ymm16{k5}{z}, ymm13, ymm15 vfmsubadd132pd ymm16{k5}{z}, ymm13, [rbx] vfmsubadd132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsubadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd132pd zmm24, zmm24, zmm31 vfmsubadd132pd zmm24, zmm24, zmm31, {rd-sae} vfmsubadd132pd zmm24, zmm24, [rbx] vfmsubadd132pd zmm24, zmm24, [rbx]{1to8} vfmsubadd132pd zmm24, zmm24, [rbx+r11*8+256] vfmsubadd132pd zmm24, zmm24, [rbx+r11*8-256] vfmsubadd132pd zmm24{k5}, zmm24, zmm31 vfmsubadd132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd132pd zmm24{k5}, zmm24, [rbx] vfmsubadd132pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsubadd132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd132pd zmm24{k5}{z}, zmm24, zmm31 vfmsubadd132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd132pd zmm24{k5}{z}, zmm24, [rbx] vfmsubadd132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsubadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsubadd132ps xmm2, xmm7, xmm0 vfmsubadd132ps xmm2, xmm7, [rbx] vfmsubadd132ps xmm2, xmm7, [rbx]{1to4} vfmsubadd132ps xmm2, xmm7, [rbx+r11*8+256] vfmsubadd132ps xmm2, xmm7, [rbx+r11*8-256] vfmsubadd132ps xmm2{k5}, xmm7, xmm0 vfmsubadd132ps xmm2{k5}, xmm7, [rbx] vfmsubadd132ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsubadd132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd132ps xmm2{k5}{z}, xmm7, xmm0 vfmsubadd132ps xmm2{k5}{z}, xmm7, [rbx] vfmsubadd132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsubadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd132ps ymm16, ymm13, ymm15 vfmsubadd132ps ymm16, ymm13, [rbx] vfmsubadd132ps ymm16, ymm13, [rbx]{1to8} vfmsubadd132ps ymm16, ymm13, [rbx+r11*8+256] vfmsubadd132ps ymm16, ymm13, [rbx+r11*8-256] vfmsubadd132ps ymm16{k5}, ymm13, ymm15 vfmsubadd132ps ymm16{k5}, ymm13, [rbx] vfmsubadd132ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsubadd132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd132ps ymm16{k5}{z}, ymm13, ymm15 vfmsubadd132ps ymm16{k5}{z}, ymm13, [rbx] vfmsubadd132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsubadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd132ps zmm24, zmm24, zmm31 vfmsubadd132ps zmm24, zmm24, zmm31, {rd-sae} vfmsubadd132ps zmm24, zmm24, [rbx] vfmsubadd132ps zmm24, zmm24, [rbx]{1to16} vfmsubadd132ps zmm24, zmm24, [rbx+r11*8+256] vfmsubadd132ps zmm24, zmm24, [rbx+r11*8-256] vfmsubadd132ps zmm24{k5}, zmm24, zmm31 vfmsubadd132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd132ps zmm24{k5}, zmm24, [rbx] vfmsubadd132ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsubadd132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd132ps zmm24{k5}{z}, zmm24, zmm31 vfmsubadd132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd132ps zmm24{k5}{z}, zmm24, [rbx] vfmsubadd132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsubadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsubadd213pd xmm2, xmm7, xmm0 vfmsubadd213pd xmm2, xmm7, [rbx] vfmsubadd213pd xmm2, xmm7, [rbx]{1to2} vfmsubadd213pd xmm2, xmm7, [rbx+r11*8+256] vfmsubadd213pd xmm2, xmm7, [rbx+r11*8-256] vfmsubadd213pd xmm2{k5}, xmm7, xmm0 vfmsubadd213pd xmm2{k5}, xmm7, [rbx] vfmsubadd213pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsubadd213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd213pd xmm2{k5}{z}, xmm7, xmm0 vfmsubadd213pd xmm2{k5}{z}, xmm7, [rbx] vfmsubadd213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsubadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd213pd ymm16, ymm13, ymm15 vfmsubadd213pd ymm16, ymm13, [rbx] vfmsubadd213pd ymm16, ymm13, [rbx]{1to4} vfmsubadd213pd ymm16, ymm13, [rbx+r11*8+256] vfmsubadd213pd ymm16, ymm13, [rbx+r11*8-256] vfmsubadd213pd ymm16{k5}, ymm13, ymm15 vfmsubadd213pd ymm16{k5}, ymm13, [rbx] vfmsubadd213pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsubadd213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd213pd ymm16{k5}{z}, ymm13, ymm15 vfmsubadd213pd ymm16{k5}{z}, ymm13, [rbx] vfmsubadd213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsubadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd213pd zmm24, zmm24, zmm31 vfmsubadd213pd zmm24, zmm24, zmm31, {rd-sae} vfmsubadd213pd zmm24, zmm24, [rbx] vfmsubadd213pd zmm24, zmm24, [rbx]{1to8} vfmsubadd213pd zmm24, zmm24, [rbx+r11*8+256] vfmsubadd213pd zmm24, zmm24, [rbx+r11*8-256] vfmsubadd213pd zmm24{k5}, zmm24, zmm31 vfmsubadd213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd213pd zmm24{k5}, zmm24, [rbx] vfmsubadd213pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsubadd213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd213pd zmm24{k5}{z}, zmm24, zmm31 vfmsubadd213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd213pd zmm24{k5}{z}, zmm24, [rbx] vfmsubadd213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsubadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsubadd213ps xmm2, xmm7, xmm0 vfmsubadd213ps xmm2, xmm7, [rbx] vfmsubadd213ps xmm2, xmm7, [rbx]{1to4} vfmsubadd213ps xmm2, xmm7, [rbx+r11*8+256] vfmsubadd213ps xmm2, xmm7, [rbx+r11*8-256] vfmsubadd213ps xmm2{k5}, xmm7, xmm0 vfmsubadd213ps xmm2{k5}, xmm7, [rbx] vfmsubadd213ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsubadd213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd213ps xmm2{k5}{z}, xmm7, xmm0 vfmsubadd213ps xmm2{k5}{z}, xmm7, [rbx] vfmsubadd213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsubadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd213ps ymm16, ymm13, ymm15 vfmsubadd213ps ymm16, ymm13, [rbx] vfmsubadd213ps ymm16, ymm13, [rbx]{1to8} vfmsubadd213ps ymm16, ymm13, [rbx+r11*8+256] vfmsubadd213ps ymm16, ymm13, [rbx+r11*8-256] vfmsubadd213ps ymm16{k5}, ymm13, ymm15 vfmsubadd213ps ymm16{k5}, ymm13, [rbx] vfmsubadd213ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsubadd213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd213ps ymm16{k5}{z}, ymm13, ymm15 vfmsubadd213ps ymm16{k5}{z}, ymm13, [rbx] vfmsubadd213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsubadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd213ps zmm24, zmm24, zmm31 vfmsubadd213ps zmm24, zmm24, zmm31, {rd-sae} vfmsubadd213ps zmm24, zmm24, [rbx] vfmsubadd213ps zmm24, zmm24, [rbx]{1to16} vfmsubadd213ps zmm24, zmm24, [rbx+r11*8+256] vfmsubadd213ps zmm24, zmm24, [rbx+r11*8-256] vfmsubadd213ps zmm24{k5}, zmm24, zmm31 vfmsubadd213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd213ps zmm24{k5}, zmm24, [rbx] vfmsubadd213ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsubadd213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd213ps zmm24{k5}{z}, zmm24, zmm31 vfmsubadd213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd213ps zmm24{k5}{z}, zmm24, [rbx] vfmsubadd213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsubadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsubadd231pd xmm2, xmm7, xmm0 vfmsubadd231pd xmm2, xmm7, [rbx] vfmsubadd231pd xmm2, xmm7, [rbx]{1to2} vfmsubadd231pd xmm2, xmm7, [rbx+r11*8+256] vfmsubadd231pd xmm2, xmm7, [rbx+r11*8-256] vfmsubadd231pd xmm2{k5}, xmm7, xmm0 vfmsubadd231pd xmm2{k5}, xmm7, [rbx] vfmsubadd231pd xmm2{k5}, xmm7, [rbx]{1to2} vfmsubadd231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd231pd xmm2{k5}{z}, xmm7, xmm0 vfmsubadd231pd xmm2{k5}{z}, xmm7, [rbx] vfmsubadd231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfmsubadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd231pd ymm16, ymm13, ymm15 vfmsubadd231pd ymm16, ymm13, [rbx] vfmsubadd231pd ymm16, ymm13, [rbx]{1to4} vfmsubadd231pd ymm16, ymm13, [rbx+r11*8+256] vfmsubadd231pd ymm16, ymm13, [rbx+r11*8-256] vfmsubadd231pd ymm16{k5}, ymm13, ymm15 vfmsubadd231pd ymm16{k5}, ymm13, [rbx] vfmsubadd231pd ymm16{k5}, ymm13, [rbx]{1to4} vfmsubadd231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd231pd ymm16{k5}{z}, ymm13, ymm15 vfmsubadd231pd ymm16{k5}{z}, ymm13, [rbx] vfmsubadd231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfmsubadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd231pd zmm24, zmm24, zmm31 vfmsubadd231pd zmm24, zmm24, zmm31, {rd-sae} vfmsubadd231pd zmm24, zmm24, [rbx] vfmsubadd231pd zmm24, zmm24, [rbx]{1to8} vfmsubadd231pd zmm24, zmm24, [rbx+r11*8+256] vfmsubadd231pd zmm24, zmm24, [rbx+r11*8-256] vfmsubadd231pd zmm24{k5}, zmm24, zmm31 vfmsubadd231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd231pd zmm24{k5}, zmm24, [rbx] vfmsubadd231pd zmm24{k5}, zmm24, [rbx]{1to8} vfmsubadd231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd231pd zmm24{k5}{z}, zmm24, zmm31 vfmsubadd231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd231pd zmm24{k5}{z}, zmm24, [rbx] vfmsubadd231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfmsubadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfmsubadd231ps xmm2, xmm7, xmm0 vfmsubadd231ps xmm2, xmm7, [rbx] vfmsubadd231ps xmm2, xmm7, [rbx]{1to4} vfmsubadd231ps xmm2, xmm7, [rbx+r11*8+256] vfmsubadd231ps xmm2, xmm7, [rbx+r11*8-256] vfmsubadd231ps xmm2{k5}, xmm7, xmm0 vfmsubadd231ps xmm2{k5}, xmm7, [rbx] vfmsubadd231ps xmm2{k5}, xmm7, [rbx]{1to4} vfmsubadd231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfmsubadd231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfmsubadd231ps xmm2{k5}{z}, xmm7, xmm0 vfmsubadd231ps xmm2{k5}{z}, xmm7, [rbx] vfmsubadd231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfmsubadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfmsubadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfmsubadd231ps ymm16, ymm13, ymm15 vfmsubadd231ps ymm16, ymm13, [rbx] vfmsubadd231ps ymm16, ymm13, [rbx]{1to8} vfmsubadd231ps ymm16, ymm13, [rbx+r11*8+256] vfmsubadd231ps ymm16, ymm13, [rbx+r11*8-256] vfmsubadd231ps ymm16{k5}, ymm13, ymm15 vfmsubadd231ps ymm16{k5}, ymm13, [rbx] vfmsubadd231ps ymm16{k5}, ymm13, [rbx]{1to8} vfmsubadd231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfmsubadd231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfmsubadd231ps ymm16{k5}{z}, ymm13, ymm15 vfmsubadd231ps ymm16{k5}{z}, ymm13, [rbx] vfmsubadd231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfmsubadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfmsubadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfmsubadd231ps zmm24, zmm24, zmm31 vfmsubadd231ps zmm24, zmm24, zmm31, {rd-sae} vfmsubadd231ps zmm24, zmm24, [rbx] vfmsubadd231ps zmm24, zmm24, [rbx]{1to16} vfmsubadd231ps zmm24, zmm24, [rbx+r11*8+256] vfmsubadd231ps zmm24, zmm24, [rbx+r11*8-256] vfmsubadd231ps zmm24{k5}, zmm24, zmm31 vfmsubadd231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfmsubadd231ps zmm24{k5}, zmm24, [rbx] vfmsubadd231ps zmm24{k5}, zmm24, [rbx]{1to16} vfmsubadd231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfmsubadd231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfmsubadd231ps zmm24{k5}{z}, zmm24, zmm31 vfmsubadd231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfmsubadd231ps zmm24{k5}{z}, zmm24, [rbx] vfmsubadd231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfmsubadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfmsubadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd132pd xmm2, xmm7, xmm0 vfnmadd132pd xmm2, xmm7, [rbx] vfnmadd132pd xmm2, xmm7, [rbx]{1to2} vfnmadd132pd xmm2, xmm7, [rbx+r11*8+256] vfnmadd132pd xmm2, xmm7, [rbx+r11*8-256] vfnmadd132pd xmm2{k5}, xmm7, xmm0 vfnmadd132pd xmm2{k5}, xmm7, [rbx] vfnmadd132pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmadd132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd132pd xmm2{k5}{z}, xmm7, xmm0 vfnmadd132pd xmm2{k5}{z}, xmm7, [rbx] vfnmadd132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd132pd ymm16, ymm13, ymm15 vfnmadd132pd ymm16, ymm13, [rbx] vfnmadd132pd ymm16, ymm13, [rbx]{1to4} vfnmadd132pd ymm16, ymm13, [rbx+r11*8+256] vfnmadd132pd ymm16, ymm13, [rbx+r11*8-256] vfnmadd132pd ymm16{k5}, ymm13, ymm15 vfnmadd132pd ymm16{k5}, ymm13, [rbx] vfnmadd132pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmadd132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd132pd ymm16{k5}{z}, ymm13, ymm15 vfnmadd132pd ymm16{k5}{z}, ymm13, [rbx] vfnmadd132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd132pd zmm24, zmm24, zmm31 vfnmadd132pd zmm24, zmm24, zmm31, {rd-sae} vfnmadd132pd zmm24, zmm24, [rbx] vfnmadd132pd zmm24, zmm24, [rbx]{1to8} vfnmadd132pd zmm24, zmm24, [rbx+r11*8+256] vfnmadd132pd zmm24, zmm24, [rbx+r11*8-256] vfnmadd132pd zmm24{k5}, zmm24, zmm31 vfnmadd132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd132pd zmm24{k5}, zmm24, [rbx] vfnmadd132pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmadd132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd132pd zmm24{k5}{z}, zmm24, zmm31 vfnmadd132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd132pd zmm24{k5}{z}, zmm24, [rbx] vfnmadd132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd132ps xmm2, xmm7, xmm0 vfnmadd132ps xmm2, xmm7, [rbx] vfnmadd132ps xmm2, xmm7, [rbx]{1to4} vfnmadd132ps xmm2, xmm7, [rbx+r11*8+256] vfnmadd132ps xmm2, xmm7, [rbx+r11*8-256] vfnmadd132ps xmm2{k5}, xmm7, xmm0 vfnmadd132ps xmm2{k5}, xmm7, [rbx] vfnmadd132ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmadd132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd132ps xmm2{k5}{z}, xmm7, xmm0 vfnmadd132ps xmm2{k5}{z}, xmm7, [rbx] vfnmadd132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd132ps ymm16, ymm13, ymm15 vfnmadd132ps ymm16, ymm13, [rbx] vfnmadd132ps ymm16, ymm13, [rbx]{1to8} vfnmadd132ps ymm16, ymm13, [rbx+r11*8+256] vfnmadd132ps ymm16, ymm13, [rbx+r11*8-256] vfnmadd132ps ymm16{k5}, ymm13, ymm15 vfnmadd132ps ymm16{k5}, ymm13, [rbx] vfnmadd132ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmadd132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd132ps ymm16{k5}{z}, ymm13, ymm15 vfnmadd132ps ymm16{k5}{z}, ymm13, [rbx] vfnmadd132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd132ps zmm24, zmm24, zmm31 vfnmadd132ps zmm24, zmm24, zmm31, {rd-sae} vfnmadd132ps zmm24, zmm24, [rbx] vfnmadd132ps zmm24, zmm24, [rbx]{1to16} vfnmadd132ps zmm24, zmm24, [rbx+r11*8+256] vfnmadd132ps zmm24, zmm24, [rbx+r11*8-256] vfnmadd132ps zmm24{k5}, zmm24, zmm31 vfnmadd132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd132ps zmm24{k5}, zmm24, [rbx] vfnmadd132ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmadd132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd132ps zmm24{k5}{z}, zmm24, zmm31 vfnmadd132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd132ps zmm24{k5}{z}, zmm24, [rbx] vfnmadd132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd132sd xmm2, xmm7, xmm0 vfnmadd132sd xmm2, xmm7, xmm0, {rd-sae} vfnmadd132sd xmm2, xmm7, [rbx] vfnmadd132sd xmm2, xmm7, [rbx+r11*8+256] vfnmadd132sd xmm2, xmm7, [rbx+r11*8-256] vfnmadd132sd xmm2{k5}, xmm7, xmm0 vfnmadd132sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd132sd xmm2{k5}, xmm7, [rbx] vfnmadd132sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd132sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd132sd xmm2{k5}{z}, xmm7, xmm0 vfnmadd132sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd132sd xmm2{k5}{z}, xmm7, [rbx] vfnmadd132sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd132sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd132ss xmm2, xmm7, xmm0 vfnmadd132ss xmm2, xmm7, xmm0, {rd-sae} vfnmadd132ss xmm2, xmm7, [rbx] vfnmadd132ss xmm2, xmm7, [rbx+r11*8+256] vfnmadd132ss xmm2, xmm7, [rbx+r11*8-256] vfnmadd132ss xmm2{k5}, xmm7, xmm0 vfnmadd132ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd132ss xmm2{k5}, xmm7, [rbx] vfnmadd132ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd132ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd132ss xmm2{k5}{z}, xmm7, xmm0 vfnmadd132ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd132ss xmm2{k5}{z}, xmm7, [rbx] vfnmadd132ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd132ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd213pd xmm2, xmm7, xmm0 vfnmadd213pd xmm2, xmm7, [rbx] vfnmadd213pd xmm2, xmm7, [rbx]{1to2} vfnmadd213pd xmm2, xmm7, [rbx+r11*8+256] vfnmadd213pd xmm2, xmm7, [rbx+r11*8-256] vfnmadd213pd xmm2{k5}, xmm7, xmm0 vfnmadd213pd xmm2{k5}, xmm7, [rbx] vfnmadd213pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmadd213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd213pd xmm2{k5}{z}, xmm7, xmm0 vfnmadd213pd xmm2{k5}{z}, xmm7, [rbx] vfnmadd213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd213pd ymm16, ymm13, ymm15 vfnmadd213pd ymm16, ymm13, [rbx] vfnmadd213pd ymm16, ymm13, [rbx]{1to4} vfnmadd213pd ymm16, ymm13, [rbx+r11*8+256] vfnmadd213pd ymm16, ymm13, [rbx+r11*8-256] vfnmadd213pd ymm16{k5}, ymm13, ymm15 vfnmadd213pd ymm16{k5}, ymm13, [rbx] vfnmadd213pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmadd213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd213pd ymm16{k5}{z}, ymm13, ymm15 vfnmadd213pd ymm16{k5}{z}, ymm13, [rbx] vfnmadd213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd213pd zmm24, zmm24, zmm31 vfnmadd213pd zmm24, zmm24, zmm31, {rd-sae} vfnmadd213pd zmm24, zmm24, [rbx] vfnmadd213pd zmm24, zmm24, [rbx]{1to8} vfnmadd213pd zmm24, zmm24, [rbx+r11*8+256] vfnmadd213pd zmm24, zmm24, [rbx+r11*8-256] vfnmadd213pd zmm24{k5}, zmm24, zmm31 vfnmadd213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd213pd zmm24{k5}, zmm24, [rbx] vfnmadd213pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmadd213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd213pd zmm24{k5}{z}, zmm24, zmm31 vfnmadd213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd213pd zmm24{k5}{z}, zmm24, [rbx] vfnmadd213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd213ps xmm2, xmm7, xmm0 vfnmadd213ps xmm2, xmm7, [rbx] vfnmadd213ps xmm2, xmm7, [rbx]{1to4} vfnmadd213ps xmm2, xmm7, [rbx+r11*8+256] vfnmadd213ps xmm2, xmm7, [rbx+r11*8-256] vfnmadd213ps xmm2{k5}, xmm7, xmm0 vfnmadd213ps xmm2{k5}, xmm7, [rbx] vfnmadd213ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmadd213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd213ps xmm2{k5}{z}, xmm7, xmm0 vfnmadd213ps xmm2{k5}{z}, xmm7, [rbx] vfnmadd213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd213ps ymm16, ymm13, ymm15 vfnmadd213ps ymm16, ymm13, [rbx] vfnmadd213ps ymm16, ymm13, [rbx]{1to8} vfnmadd213ps ymm16, ymm13, [rbx+r11*8+256] vfnmadd213ps ymm16, ymm13, [rbx+r11*8-256] vfnmadd213ps ymm16{k5}, ymm13, ymm15 vfnmadd213ps ymm16{k5}, ymm13, [rbx] vfnmadd213ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmadd213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd213ps ymm16{k5}{z}, ymm13, ymm15 vfnmadd213ps ymm16{k5}{z}, ymm13, [rbx] vfnmadd213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd213ps zmm24, zmm24, zmm31 vfnmadd213ps zmm24, zmm24, zmm31, {rd-sae} vfnmadd213ps zmm24, zmm24, [rbx] vfnmadd213ps zmm24, zmm24, [rbx]{1to16} vfnmadd213ps zmm24, zmm24, [rbx+r11*8+256] vfnmadd213ps zmm24, zmm24, [rbx+r11*8-256] vfnmadd213ps zmm24{k5}, zmm24, zmm31 vfnmadd213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd213ps zmm24{k5}, zmm24, [rbx] vfnmadd213ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmadd213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd213ps zmm24{k5}{z}, zmm24, zmm31 vfnmadd213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd213ps zmm24{k5}{z}, zmm24, [rbx] vfnmadd213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd213sd xmm2, xmm7, xmm0 vfnmadd213sd xmm2, xmm7, xmm0, {rd-sae} vfnmadd213sd xmm2, xmm7, [rbx] vfnmadd213sd xmm2, xmm7, [rbx+r11*8+256] vfnmadd213sd xmm2, xmm7, [rbx+r11*8-256] vfnmadd213sd xmm2{k5}, xmm7, xmm0 vfnmadd213sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd213sd xmm2{k5}, xmm7, [rbx] vfnmadd213sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd213sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd213sd xmm2{k5}{z}, xmm7, xmm0 vfnmadd213sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd213sd xmm2{k5}{z}, xmm7, [rbx] vfnmadd213sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd213sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd213ss xmm2, xmm7, xmm0 vfnmadd213ss xmm2, xmm7, xmm0, {rd-sae} vfnmadd213ss xmm2, xmm7, [rbx] vfnmadd213ss xmm2, xmm7, [rbx+r11*8+256] vfnmadd213ss xmm2, xmm7, [rbx+r11*8-256] vfnmadd213ss xmm2{k5}, xmm7, xmm0 vfnmadd213ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd213ss xmm2{k5}, xmm7, [rbx] vfnmadd213ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd213ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd213ss xmm2{k5}{z}, xmm7, xmm0 vfnmadd213ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd213ss xmm2{k5}{z}, xmm7, [rbx] vfnmadd213ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd213ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd231pd xmm2, xmm7, xmm0 vfnmadd231pd xmm2, xmm7, [rbx] vfnmadd231pd xmm2, xmm7, [rbx]{1to2} vfnmadd231pd xmm2, xmm7, [rbx+r11*8+256] vfnmadd231pd xmm2, xmm7, [rbx+r11*8-256] vfnmadd231pd xmm2{k5}, xmm7, xmm0 vfnmadd231pd xmm2{k5}, xmm7, [rbx] vfnmadd231pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmadd231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd231pd xmm2{k5}{z}, xmm7, xmm0 vfnmadd231pd xmm2{k5}{z}, xmm7, [rbx] vfnmadd231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd231pd ymm16, ymm13, ymm15 vfnmadd231pd ymm16, ymm13, [rbx] vfnmadd231pd ymm16, ymm13, [rbx]{1to4} vfnmadd231pd ymm16, ymm13, [rbx+r11*8+256] vfnmadd231pd ymm16, ymm13, [rbx+r11*8-256] vfnmadd231pd ymm16{k5}, ymm13, ymm15 vfnmadd231pd ymm16{k5}, ymm13, [rbx] vfnmadd231pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmadd231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd231pd ymm16{k5}{z}, ymm13, ymm15 vfnmadd231pd ymm16{k5}{z}, ymm13, [rbx] vfnmadd231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd231pd zmm24, zmm24, zmm31 vfnmadd231pd zmm24, zmm24, zmm31, {rd-sae} vfnmadd231pd zmm24, zmm24, [rbx] vfnmadd231pd zmm24, zmm24, [rbx]{1to8} vfnmadd231pd zmm24, zmm24, [rbx+r11*8+256] vfnmadd231pd zmm24, zmm24, [rbx+r11*8-256] vfnmadd231pd zmm24{k5}, zmm24, zmm31 vfnmadd231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd231pd zmm24{k5}, zmm24, [rbx] vfnmadd231pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmadd231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd231pd zmm24{k5}{z}, zmm24, zmm31 vfnmadd231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd231pd zmm24{k5}{z}, zmm24, [rbx] vfnmadd231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd231ps xmm2, xmm7, xmm0 vfnmadd231ps xmm2, xmm7, [rbx] vfnmadd231ps xmm2, xmm7, [rbx]{1to4} vfnmadd231ps xmm2, xmm7, [rbx+r11*8+256] vfnmadd231ps xmm2, xmm7, [rbx+r11*8-256] vfnmadd231ps xmm2{k5}, xmm7, xmm0 vfnmadd231ps xmm2{k5}, xmm7, [rbx] vfnmadd231ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmadd231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd231ps xmm2{k5}{z}, xmm7, xmm0 vfnmadd231ps xmm2{k5}{z}, xmm7, [rbx] vfnmadd231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd231ps ymm16, ymm13, ymm15 vfnmadd231ps ymm16, ymm13, [rbx] vfnmadd231ps ymm16, ymm13, [rbx]{1to8} vfnmadd231ps ymm16, ymm13, [rbx+r11*8+256] vfnmadd231ps ymm16, ymm13, [rbx+r11*8-256] vfnmadd231ps ymm16{k5}, ymm13, ymm15 vfnmadd231ps ymm16{k5}, ymm13, [rbx] vfnmadd231ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmadd231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmadd231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmadd231ps ymm16{k5}{z}, ymm13, ymm15 vfnmadd231ps ymm16{k5}{z}, ymm13, [rbx] vfnmadd231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmadd231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmadd231ps zmm24, zmm24, zmm31 vfnmadd231ps zmm24, zmm24, zmm31, {rd-sae} vfnmadd231ps zmm24, zmm24, [rbx] vfnmadd231ps zmm24, zmm24, [rbx]{1to16} vfnmadd231ps zmm24, zmm24, [rbx+r11*8+256] vfnmadd231ps zmm24, zmm24, [rbx+r11*8-256] vfnmadd231ps zmm24{k5}, zmm24, zmm31 vfnmadd231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmadd231ps zmm24{k5}, zmm24, [rbx] vfnmadd231ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmadd231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmadd231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmadd231ps zmm24{k5}{z}, zmm24, zmm31 vfnmadd231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmadd231ps zmm24{k5}{z}, zmm24, [rbx] vfnmadd231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmadd231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmadd231sd xmm2, xmm7, xmm0 vfnmadd231sd xmm2, xmm7, xmm0, {rd-sae} vfnmadd231sd xmm2, xmm7, [rbx] vfnmadd231sd xmm2, xmm7, [rbx+r11*8+256] vfnmadd231sd xmm2, xmm7, [rbx+r11*8-256] vfnmadd231sd xmm2{k5}, xmm7, xmm0 vfnmadd231sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd231sd xmm2{k5}, xmm7, [rbx] vfnmadd231sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd231sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd231sd xmm2{k5}{z}, xmm7, xmm0 vfnmadd231sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd231sd xmm2{k5}{z}, xmm7, [rbx] vfnmadd231sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd231sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmadd231ss xmm2, xmm7, xmm0 vfnmadd231ss xmm2, xmm7, xmm0, {rd-sae} vfnmadd231ss xmm2, xmm7, [rbx] vfnmadd231ss xmm2, xmm7, [rbx+r11*8+256] vfnmadd231ss xmm2, xmm7, [rbx+r11*8-256] vfnmadd231ss xmm2{k5}, xmm7, xmm0 vfnmadd231ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmadd231ss xmm2{k5}, xmm7, [rbx] vfnmadd231ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmadd231ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmadd231ss xmm2{k5}{z}, xmm7, xmm0 vfnmadd231ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmadd231ss xmm2{k5}{z}, xmm7, [rbx] vfnmadd231ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmadd231ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub132pd xmm2, xmm7, xmm0 vfnmsub132pd xmm2, xmm7, [rbx] vfnmsub132pd xmm2, xmm7, [rbx]{1to2} vfnmsub132pd xmm2, xmm7, [rbx+r11*8+256] vfnmsub132pd xmm2, xmm7, [rbx+r11*8-256] vfnmsub132pd xmm2{k5}, xmm7, xmm0 vfnmsub132pd xmm2{k5}, xmm7, [rbx] vfnmsub132pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmsub132pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub132pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub132pd xmm2{k5}{z}, xmm7, xmm0 vfnmsub132pd xmm2{k5}{z}, xmm7, [rbx] vfnmsub132pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub132pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub132pd ymm16, ymm13, ymm15 vfnmsub132pd ymm16, ymm13, [rbx] vfnmsub132pd ymm16, ymm13, [rbx]{1to4} vfnmsub132pd ymm16, ymm13, [rbx+r11*8+256] vfnmsub132pd ymm16, ymm13, [rbx+r11*8-256] vfnmsub132pd ymm16{k5}, ymm13, ymm15 vfnmsub132pd ymm16{k5}, ymm13, [rbx] vfnmsub132pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmsub132pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub132pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub132pd ymm16{k5}{z}, ymm13, ymm15 vfnmsub132pd ymm16{k5}{z}, ymm13, [rbx] vfnmsub132pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub132pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub132pd zmm24, zmm24, zmm31 vfnmsub132pd zmm24, zmm24, zmm31, {rd-sae} vfnmsub132pd zmm24, zmm24, [rbx] vfnmsub132pd zmm24, zmm24, [rbx]{1to8} vfnmsub132pd zmm24, zmm24, [rbx+r11*8+256] vfnmsub132pd zmm24, zmm24, [rbx+r11*8-256] vfnmsub132pd zmm24{k5}, zmm24, zmm31 vfnmsub132pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub132pd zmm24{k5}, zmm24, [rbx] vfnmsub132pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmsub132pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub132pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub132pd zmm24{k5}{z}, zmm24, zmm31 vfnmsub132pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub132pd zmm24{k5}{z}, zmm24, [rbx] vfnmsub132pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub132pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub132ps xmm2, xmm7, xmm0 vfnmsub132ps xmm2, xmm7, [rbx] vfnmsub132ps xmm2, xmm7, [rbx]{1to4} vfnmsub132ps xmm2, xmm7, [rbx+r11*8+256] vfnmsub132ps xmm2, xmm7, [rbx+r11*8-256] vfnmsub132ps xmm2{k5}, xmm7, xmm0 vfnmsub132ps xmm2{k5}, xmm7, [rbx] vfnmsub132ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmsub132ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub132ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub132ps xmm2{k5}{z}, xmm7, xmm0 vfnmsub132ps xmm2{k5}{z}, xmm7, [rbx] vfnmsub132ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub132ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub132ps ymm16, ymm13, ymm15 vfnmsub132ps ymm16, ymm13, [rbx] vfnmsub132ps ymm16, ymm13, [rbx]{1to8} vfnmsub132ps ymm16, ymm13, [rbx+r11*8+256] vfnmsub132ps ymm16, ymm13, [rbx+r11*8-256] vfnmsub132ps ymm16{k5}, ymm13, ymm15 vfnmsub132ps ymm16{k5}, ymm13, [rbx] vfnmsub132ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmsub132ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub132ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub132ps ymm16{k5}{z}, ymm13, ymm15 vfnmsub132ps ymm16{k5}{z}, ymm13, [rbx] vfnmsub132ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub132ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub132ps zmm24, zmm24, zmm31 vfnmsub132ps zmm24, zmm24, zmm31, {rd-sae} vfnmsub132ps zmm24, zmm24, [rbx] vfnmsub132ps zmm24, zmm24, [rbx]{1to16} vfnmsub132ps zmm24, zmm24, [rbx+r11*8+256] vfnmsub132ps zmm24, zmm24, [rbx+r11*8-256] vfnmsub132ps zmm24{k5}, zmm24, zmm31 vfnmsub132ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub132ps zmm24{k5}, zmm24, [rbx] vfnmsub132ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmsub132ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub132ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub132ps zmm24{k5}{z}, zmm24, zmm31 vfnmsub132ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub132ps zmm24{k5}{z}, zmm24, [rbx] vfnmsub132ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub132ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub132sd xmm2, xmm7, xmm0 vfnmsub132sd xmm2, xmm7, xmm0, {rd-sae} vfnmsub132sd xmm2, xmm7, [rbx] vfnmsub132sd xmm2, xmm7, [rbx+r11*8+256] vfnmsub132sd xmm2, xmm7, [rbx+r11*8-256] vfnmsub132sd xmm2{k5}, xmm7, xmm0 vfnmsub132sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub132sd xmm2{k5}, xmm7, [rbx] vfnmsub132sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub132sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub132sd xmm2{k5}{z}, xmm7, xmm0 vfnmsub132sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub132sd xmm2{k5}{z}, xmm7, [rbx] vfnmsub132sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub132sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub132ss xmm2, xmm7, xmm0 vfnmsub132ss xmm2, xmm7, xmm0, {rd-sae} vfnmsub132ss xmm2, xmm7, [rbx] vfnmsub132ss xmm2, xmm7, [rbx+r11*8+256] vfnmsub132ss xmm2, xmm7, [rbx+r11*8-256] vfnmsub132ss xmm2{k5}, xmm7, xmm0 vfnmsub132ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub132ss xmm2{k5}, xmm7, [rbx] vfnmsub132ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub132ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub132ss xmm2{k5}{z}, xmm7, xmm0 vfnmsub132ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub132ss xmm2{k5}{z}, xmm7, [rbx] vfnmsub132ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub132ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub213pd xmm2, xmm7, xmm0 vfnmsub213pd xmm2, xmm7, [rbx] vfnmsub213pd xmm2, xmm7, [rbx]{1to2} vfnmsub213pd xmm2, xmm7, [rbx+r11*8+256] vfnmsub213pd xmm2, xmm7, [rbx+r11*8-256] vfnmsub213pd xmm2{k5}, xmm7, xmm0 vfnmsub213pd xmm2{k5}, xmm7, [rbx] vfnmsub213pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmsub213pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub213pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub213pd xmm2{k5}{z}, xmm7, xmm0 vfnmsub213pd xmm2{k5}{z}, xmm7, [rbx] vfnmsub213pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub213pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub213pd ymm16, ymm13, ymm15 vfnmsub213pd ymm16, ymm13, [rbx] vfnmsub213pd ymm16, ymm13, [rbx]{1to4} vfnmsub213pd ymm16, ymm13, [rbx+r11*8+256] vfnmsub213pd ymm16, ymm13, [rbx+r11*8-256] vfnmsub213pd ymm16{k5}, ymm13, ymm15 vfnmsub213pd ymm16{k5}, ymm13, [rbx] vfnmsub213pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmsub213pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub213pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub213pd ymm16{k5}{z}, ymm13, ymm15 vfnmsub213pd ymm16{k5}{z}, ymm13, [rbx] vfnmsub213pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub213pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub213pd zmm24, zmm24, zmm31 vfnmsub213pd zmm24, zmm24, zmm31, {rd-sae} vfnmsub213pd zmm24, zmm24, [rbx] vfnmsub213pd zmm24, zmm24, [rbx]{1to8} vfnmsub213pd zmm24, zmm24, [rbx+r11*8+256] vfnmsub213pd zmm24, zmm24, [rbx+r11*8-256] vfnmsub213pd zmm24{k5}, zmm24, zmm31 vfnmsub213pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub213pd zmm24{k5}, zmm24, [rbx] vfnmsub213pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmsub213pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub213pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub213pd zmm24{k5}{z}, zmm24, zmm31 vfnmsub213pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub213pd zmm24{k5}{z}, zmm24, [rbx] vfnmsub213pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub213pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub213ps xmm2, xmm7, xmm0 vfnmsub213ps xmm2, xmm7, [rbx] vfnmsub213ps xmm2, xmm7, [rbx]{1to4} vfnmsub213ps xmm2, xmm7, [rbx+r11*8+256] vfnmsub213ps xmm2, xmm7, [rbx+r11*8-256] vfnmsub213ps xmm2{k5}, xmm7, xmm0 vfnmsub213ps xmm2{k5}, xmm7, [rbx] vfnmsub213ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmsub213ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub213ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub213ps xmm2{k5}{z}, xmm7, xmm0 vfnmsub213ps xmm2{k5}{z}, xmm7, [rbx] vfnmsub213ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub213ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub213ps ymm16, ymm13, ymm15 vfnmsub213ps ymm16, ymm13, [rbx] vfnmsub213ps ymm16, ymm13, [rbx]{1to8} vfnmsub213ps ymm16, ymm13, [rbx+r11*8+256] vfnmsub213ps ymm16, ymm13, [rbx+r11*8-256] vfnmsub213ps ymm16{k5}, ymm13, ymm15 vfnmsub213ps ymm16{k5}, ymm13, [rbx] vfnmsub213ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmsub213ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub213ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub213ps ymm16{k5}{z}, ymm13, ymm15 vfnmsub213ps ymm16{k5}{z}, ymm13, [rbx] vfnmsub213ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub213ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub213ps zmm24, zmm24, zmm31 vfnmsub213ps zmm24, zmm24, zmm31, {rd-sae} vfnmsub213ps zmm24, zmm24, [rbx] vfnmsub213ps zmm24, zmm24, [rbx]{1to16} vfnmsub213ps zmm24, zmm24, [rbx+r11*8+256] vfnmsub213ps zmm24, zmm24, [rbx+r11*8-256] vfnmsub213ps zmm24{k5}, zmm24, zmm31 vfnmsub213ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub213ps zmm24{k5}, zmm24, [rbx] vfnmsub213ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmsub213ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub213ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub213ps zmm24{k5}{z}, zmm24, zmm31 vfnmsub213ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub213ps zmm24{k5}{z}, zmm24, [rbx] vfnmsub213ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub213ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub213sd xmm2, xmm7, xmm0 vfnmsub213sd xmm2, xmm7, xmm0, {rd-sae} vfnmsub213sd xmm2, xmm7, [rbx] vfnmsub213sd xmm2, xmm7, [rbx+r11*8+256] vfnmsub213sd xmm2, xmm7, [rbx+r11*8-256] vfnmsub213sd xmm2{k5}, xmm7, xmm0 vfnmsub213sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub213sd xmm2{k5}, xmm7, [rbx] vfnmsub213sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub213sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub213sd xmm2{k5}{z}, xmm7, xmm0 vfnmsub213sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub213sd xmm2{k5}{z}, xmm7, [rbx] vfnmsub213sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub213sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub213ss xmm2, xmm7, xmm0 vfnmsub213ss xmm2, xmm7, xmm0, {rd-sae} vfnmsub213ss xmm2, xmm7, [rbx] vfnmsub213ss xmm2, xmm7, [rbx+r11*8+256] vfnmsub213ss xmm2, xmm7, [rbx+r11*8-256] vfnmsub213ss xmm2{k5}, xmm7, xmm0 vfnmsub213ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub213ss xmm2{k5}, xmm7, [rbx] vfnmsub213ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub213ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub213ss xmm2{k5}{z}, xmm7, xmm0 vfnmsub213ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub213ss xmm2{k5}{z}, xmm7, [rbx] vfnmsub213ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub213ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub231pd xmm2, xmm7, xmm0 vfnmsub231pd xmm2, xmm7, [rbx] vfnmsub231pd xmm2, xmm7, [rbx]{1to2} vfnmsub231pd xmm2, xmm7, [rbx+r11*8+256] vfnmsub231pd xmm2, xmm7, [rbx+r11*8-256] vfnmsub231pd xmm2{k5}, xmm7, xmm0 vfnmsub231pd xmm2{k5}, xmm7, [rbx] vfnmsub231pd xmm2{k5}, xmm7, [rbx]{1to2} vfnmsub231pd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub231pd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub231pd xmm2{k5}{z}, xmm7, xmm0 vfnmsub231pd xmm2{k5}{z}, xmm7, [rbx] vfnmsub231pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vfnmsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub231pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub231pd ymm16, ymm13, ymm15 vfnmsub231pd ymm16, ymm13, [rbx] vfnmsub231pd ymm16, ymm13, [rbx]{1to4} vfnmsub231pd ymm16, ymm13, [rbx+r11*8+256] vfnmsub231pd ymm16, ymm13, [rbx+r11*8-256] vfnmsub231pd ymm16{k5}, ymm13, ymm15 vfnmsub231pd ymm16{k5}, ymm13, [rbx] vfnmsub231pd ymm16{k5}, ymm13, [rbx]{1to4} vfnmsub231pd ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub231pd ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub231pd ymm16{k5}{z}, ymm13, ymm15 vfnmsub231pd ymm16{k5}{z}, ymm13, [rbx] vfnmsub231pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vfnmsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub231pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub231pd zmm24, zmm24, zmm31 vfnmsub231pd zmm24, zmm24, zmm31, {rd-sae} vfnmsub231pd zmm24, zmm24, [rbx] vfnmsub231pd zmm24, zmm24, [rbx]{1to8} vfnmsub231pd zmm24, zmm24, [rbx+r11*8+256] vfnmsub231pd zmm24, zmm24, [rbx+r11*8-256] vfnmsub231pd zmm24{k5}, zmm24, zmm31 vfnmsub231pd zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub231pd zmm24{k5}, zmm24, [rbx] vfnmsub231pd zmm24{k5}, zmm24, [rbx]{1to8} vfnmsub231pd zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub231pd zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub231pd zmm24{k5}{z}, zmm24, zmm31 vfnmsub231pd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub231pd zmm24{k5}{z}, zmm24, [rbx] vfnmsub231pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vfnmsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub231pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub231ps xmm2, xmm7, xmm0 vfnmsub231ps xmm2, xmm7, [rbx] vfnmsub231ps xmm2, xmm7, [rbx]{1to4} vfnmsub231ps xmm2, xmm7, [rbx+r11*8+256] vfnmsub231ps xmm2, xmm7, [rbx+r11*8-256] vfnmsub231ps xmm2{k5}, xmm7, xmm0 vfnmsub231ps xmm2{k5}, xmm7, [rbx] vfnmsub231ps xmm2{k5}, xmm7, [rbx]{1to4} vfnmsub231ps xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub231ps xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub231ps xmm2{k5}{z}, xmm7, xmm0 vfnmsub231ps xmm2{k5}{z}, xmm7, [rbx] vfnmsub231ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vfnmsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub231ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub231ps ymm16, ymm13, ymm15 vfnmsub231ps ymm16, ymm13, [rbx] vfnmsub231ps ymm16, ymm13, [rbx]{1to8} vfnmsub231ps ymm16, ymm13, [rbx+r11*8+256] vfnmsub231ps ymm16, ymm13, [rbx+r11*8-256] vfnmsub231ps ymm16{k5}, ymm13, ymm15 vfnmsub231ps ymm16{k5}, ymm13, [rbx] vfnmsub231ps ymm16{k5}, ymm13, [rbx]{1to8} vfnmsub231ps ymm16{k5}, ymm13, [rbx+r11*8+256] vfnmsub231ps ymm16{k5}, ymm13, [rbx+r11*8-256] vfnmsub231ps ymm16{k5}{z}, ymm13, ymm15 vfnmsub231ps ymm16{k5}{z}, ymm13, [rbx] vfnmsub231ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vfnmsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vfnmsub231ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vfnmsub231ps zmm24, zmm24, zmm31 vfnmsub231ps zmm24, zmm24, zmm31, {rd-sae} vfnmsub231ps zmm24, zmm24, [rbx] vfnmsub231ps zmm24, zmm24, [rbx]{1to16} vfnmsub231ps zmm24, zmm24, [rbx+r11*8+256] vfnmsub231ps zmm24, zmm24, [rbx+r11*8-256] vfnmsub231ps zmm24{k5}, zmm24, zmm31 vfnmsub231ps zmm24{k5}, zmm24, zmm31, {rd-sae} vfnmsub231ps zmm24{k5}, zmm24, [rbx] vfnmsub231ps zmm24{k5}, zmm24, [rbx]{1to16} vfnmsub231ps zmm24{k5}, zmm24, [rbx+r11*8+256] vfnmsub231ps zmm24{k5}, zmm24, [rbx+r11*8-256] vfnmsub231ps zmm24{k5}{z}, zmm24, zmm31 vfnmsub231ps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vfnmsub231ps zmm24{k5}{z}, zmm24, [rbx] vfnmsub231ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vfnmsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vfnmsub231ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vfnmsub231sd xmm2, xmm7, xmm0 vfnmsub231sd xmm2, xmm7, xmm0, {rd-sae} vfnmsub231sd xmm2, xmm7, [rbx] vfnmsub231sd xmm2, xmm7, [rbx+r11*8+256] vfnmsub231sd xmm2, xmm7, [rbx+r11*8-256] vfnmsub231sd xmm2{k5}, xmm7, xmm0 vfnmsub231sd xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub231sd xmm2{k5}, xmm7, [rbx] vfnmsub231sd xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub231sd xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub231sd xmm2{k5}{z}, xmm7, xmm0 vfnmsub231sd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub231sd xmm2{k5}{z}, xmm7, [rbx] vfnmsub231sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub231sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vfnmsub231ss xmm2, xmm7, xmm0 vfnmsub231ss xmm2, xmm7, xmm0, {rd-sae} vfnmsub231ss xmm2, xmm7, [rbx] vfnmsub231ss xmm2, xmm7, [rbx+r11*8+256] vfnmsub231ss xmm2, xmm7, [rbx+r11*8-256] vfnmsub231ss xmm2{k5}, xmm7, xmm0 vfnmsub231ss xmm2{k5}, xmm7, xmm0, {rd-sae} vfnmsub231ss xmm2{k5}, xmm7, [rbx] vfnmsub231ss xmm2{k5}, xmm7, [rbx+r11*8+256] vfnmsub231ss xmm2{k5}, xmm7, [rbx+r11*8-256] vfnmsub231ss xmm2{k5}{z}, xmm7, xmm0 vfnmsub231ss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vfnmsub231ss xmm2{k5}{z}, xmm7, [rbx] vfnmsub231ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vfnmsub231ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vgetexppd xmm2, xmm0 vgetexppd xmm2, [rbx] vgetexppd xmm2, [rbx]{1to2} vgetexppd xmm2, [rbx+r11*8+256] vgetexppd xmm2, [rbx+r11*8-256] vgetexppd xmm2{k5}, xmm0 vgetexppd xmm2{k5}, [rbx] vgetexppd xmm2{k5}, [rbx]{1to2} vgetexppd xmm2{k5}, [rbx+r11*8+256] vgetexppd xmm2{k5}, [rbx+r11*8-256] vgetexppd xmm2{k5}{z}, xmm0 vgetexppd xmm2{k5}{z}, [rbx] vgetexppd xmm2{k5}{z}, [rbx]{1to2} vgetexppd xmm2{k5}{z}, [rbx+r11*8+256] vgetexppd xmm2{k5}{z}, [rbx+r11*8-256] vgetexppd ymm16, ymm15 vgetexppd ymm16, [rbx] vgetexppd ymm16, [rbx]{1to4} vgetexppd ymm16, [rbx+r11*8+256] vgetexppd ymm16, [rbx+r11*8-256] vgetexppd ymm16{k5}, ymm15 vgetexppd ymm16{k5}, [rbx] vgetexppd ymm16{k5}, [rbx]{1to4} vgetexppd ymm16{k5}, [rbx+r11*8+256] vgetexppd ymm16{k5}, [rbx+r11*8-256] vgetexppd ymm16{k5}{z}, ymm15 vgetexppd ymm16{k5}{z}, [rbx] vgetexppd ymm16{k5}{z}, [rbx]{1to4} vgetexppd ymm16{k5}{z}, [rbx+r11*8+256] vgetexppd ymm16{k5}{z}, [rbx+r11*8-256] vgetexppd zmm24, zmm31 vgetexppd zmm24, zmm31, {sae} vgetexppd zmm24, [rbx] vgetexppd zmm24, [rbx]{1to8} vgetexppd zmm24, [rbx+r11*8+256] vgetexppd zmm24, [rbx+r11*8-256] vgetexppd zmm24{k5}, zmm31 vgetexppd zmm24{k5}, zmm31, {sae} vgetexppd zmm24{k5}, [rbx] vgetexppd zmm24{k5}, [rbx]{1to8} vgetexppd zmm24{k5}, [rbx+r11*8+256] vgetexppd zmm24{k5}, [rbx+r11*8-256] vgetexppd zmm24{k5}{z}, zmm31 vgetexppd zmm24{k5}{z}, zmm31, {sae} vgetexppd zmm24{k5}{z}, [rbx] vgetexppd zmm24{k5}{z}, [rbx]{1to8} vgetexppd zmm24{k5}{z}, [rbx+r11*8+256] vgetexppd zmm24{k5}{z}, [rbx+r11*8-256] vgetexpps xmm2, xmm0 vgetexpps xmm2, [rbx] vgetexpps xmm2, [rbx]{1to4} vgetexpps xmm2, [rbx+r11*8+256] vgetexpps xmm2, [rbx+r11*8-256] vgetexpps xmm2{k5}, xmm0 vgetexpps xmm2{k5}, [rbx] vgetexpps xmm2{k5}, [rbx]{1to4} vgetexpps xmm2{k5}, [rbx+r11*8+256] vgetexpps xmm2{k5}, [rbx+r11*8-256] vgetexpps xmm2{k5}{z}, xmm0 vgetexpps xmm2{k5}{z}, [rbx] vgetexpps xmm2{k5}{z}, [rbx]{1to4} vgetexpps xmm2{k5}{z}, [rbx+r11*8+256] vgetexpps xmm2{k5}{z}, [rbx+r11*8-256] vgetexpps ymm16, ymm15 vgetexpps ymm16, [rbx] vgetexpps ymm16, [rbx]{1to8} vgetexpps ymm16, [rbx+r11*8+256] vgetexpps ymm16, [rbx+r11*8-256] vgetexpps ymm16{k5}, ymm15 vgetexpps ymm16{k5}, [rbx] vgetexpps ymm16{k5}, [rbx]{1to8} vgetexpps ymm16{k5}, [rbx+r11*8+256] vgetexpps ymm16{k5}, [rbx+r11*8-256] vgetexpps ymm16{k5}{z}, ymm15 vgetexpps ymm16{k5}{z}, [rbx] vgetexpps ymm16{k5}{z}, [rbx]{1to8} vgetexpps ymm16{k5}{z}, [rbx+r11*8+256] vgetexpps ymm16{k5}{z}, [rbx+r11*8-256] vgetexpps zmm24, zmm31 vgetexpps zmm24, zmm31, {sae} vgetexpps zmm24, [rbx] vgetexpps zmm24, [rbx]{1to16} vgetexpps zmm24, [rbx+r11*8+256] vgetexpps zmm24, [rbx+r11*8-256] vgetexpps zmm24{k5}, zmm31 vgetexpps zmm24{k5}, zmm31, {sae} vgetexpps zmm24{k5}, [rbx] vgetexpps zmm24{k5}, [rbx]{1to16} vgetexpps zmm24{k5}, [rbx+r11*8+256] vgetexpps zmm24{k5}, [rbx+r11*8-256] vgetexpps zmm24{k5}{z}, zmm31 vgetexpps zmm24{k5}{z}, zmm31, {sae} vgetexpps zmm24{k5}{z}, [rbx] vgetexpps zmm24{k5}{z}, [rbx]{1to16} vgetexpps zmm24{k5}{z}, [rbx+r11*8+256] vgetexpps zmm24{k5}{z}, [rbx+r11*8-256] vgetexpsd xmm2, xmm7, xmm0 vgetexpsd xmm2, xmm7, xmm0, {sae} vgetexpsd xmm2, xmm7, [rbx] vgetexpsd xmm2, xmm7, [rbx+r11*8+256] vgetexpsd xmm2, xmm7, [rbx+r11*8-256] vgetexpsd xmm2{k5}, xmm7, xmm0 vgetexpsd xmm2{k5}, xmm7, xmm0, {sae} vgetexpsd xmm2{k5}, xmm7, [rbx] vgetexpsd xmm2{k5}, xmm7, [rbx+r11*8+256] vgetexpsd xmm2{k5}, xmm7, [rbx+r11*8-256] vgetexpsd xmm2{k5}{z}, xmm7, xmm0 vgetexpsd xmm2{k5}{z}, xmm7, xmm0, {sae} vgetexpsd xmm2{k5}{z}, xmm7, [rbx] vgetexpsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vgetexpsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vgetexpss xmm2, xmm7, xmm0 vgetexpss xmm2, xmm7, xmm0, {sae} vgetexpss xmm2, xmm7, [rbx] vgetexpss xmm2, xmm7, [rbx+r11*8+256] vgetexpss xmm2, xmm7, [rbx+r11*8-256] vgetexpss xmm2{k5}, xmm7, xmm0 vgetexpss xmm2{k5}, xmm7, xmm0, {sae} vgetexpss xmm2{k5}, xmm7, [rbx] vgetexpss xmm2{k5}, xmm7, [rbx+r11*8+256] vgetexpss xmm2{k5}, xmm7, [rbx+r11*8-256] vgetexpss xmm2{k5}{z}, xmm7, xmm0 vgetexpss xmm2{k5}{z}, xmm7, xmm0, {sae} vgetexpss xmm2{k5}{z}, xmm7, [rbx] vgetexpss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vgetexpss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vgetmantpd xmm2, xmm0, 10 vgetmantpd xmm2, [rbx], 10 vgetmantpd xmm2, [rbx]{1to2}, 10 vgetmantpd xmm2, [rbx+r11*8+256], 10 vgetmantpd xmm2, [rbx+r11*8-256], 10 vgetmantpd xmm2{k5}, xmm0, 10 vgetmantpd xmm2{k5}, [rbx], 10 vgetmantpd xmm2{k5}, [rbx]{1to2}, 10 vgetmantpd xmm2{k5}, [rbx+r11*8+256], 10 vgetmantpd xmm2{k5}, [rbx+r11*8-256], 10 vgetmantpd xmm2{k5}{z}, xmm0, 10 vgetmantpd xmm2{k5}{z}, [rbx], 10 vgetmantpd xmm2{k5}{z}, [rbx]{1to2}, 10 vgetmantpd xmm2{k5}{z}, [rbx+r11*8+256], 10 vgetmantpd xmm2{k5}{z}, [rbx+r11*8-256], 10 vgetmantpd ymm16, ymm15, 10 vgetmantpd ymm16, [rbx], 10 vgetmantpd ymm16, [rbx]{1to4}, 10 vgetmantpd ymm16, [rbx+r11*8+256], 10 vgetmantpd ymm16, [rbx+r11*8-256], 10 vgetmantpd ymm16{k5}, ymm15, 10 vgetmantpd ymm16{k5}, [rbx], 10 vgetmantpd ymm16{k5}, [rbx]{1to4}, 10 vgetmantpd ymm16{k5}, [rbx+r11*8+256], 10 vgetmantpd ymm16{k5}, [rbx+r11*8-256], 10 vgetmantpd ymm16{k5}{z}, ymm15, 10 vgetmantpd ymm16{k5}{z}, [rbx], 10 vgetmantpd ymm16{k5}{z}, [rbx]{1to4}, 10 vgetmantpd ymm16{k5}{z}, [rbx+r11*8+256], 10 vgetmantpd ymm16{k5}{z}, [rbx+r11*8-256], 10 vgetmantpd zmm24, zmm31, 10 vgetmantpd zmm24, [rbx], 10 vgetmantpd zmm24, [rbx]{1to8}, 10 vgetmantpd zmm24, [rbx+r11*8+256], 10 vgetmantpd zmm24, [rbx+r11*8-256], 10 vgetmantpd zmm24{k5}, zmm31, 10 vgetmantpd zmm24{k5}, [rbx], 10 vgetmantpd zmm24{k5}, [rbx]{1to8}, 10 vgetmantpd zmm24{k5}, [rbx+r11*8+256], 10 vgetmantpd zmm24{k5}, [rbx+r11*8-256], 10 vgetmantpd zmm24{k5}{z}, zmm31, 10 vgetmantpd zmm24{k5}{z}, [rbx], 10 vgetmantpd zmm24{k5}{z}, [rbx]{1to8}, 10 vgetmantpd zmm24{k5}{z}, [rbx+r11*8+256], 10 vgetmantpd zmm24{k5}{z}, [rbx+r11*8-256], 10 vgetmantps xmm2, xmm0, 10 vgetmantps xmm2, [rbx], 10 vgetmantps xmm2, [rbx]{1to4}, 10 vgetmantps xmm2, [rbx+r11*8+256], 10 vgetmantps xmm2, [rbx+r11*8-256], 10 vgetmantps xmm2{k5}, xmm0, 10 vgetmantps xmm2{k5}, [rbx], 10 vgetmantps xmm2{k5}, [rbx]{1to4}, 10 vgetmantps xmm2{k5}, [rbx+r11*8+256], 10 vgetmantps xmm2{k5}, [rbx+r11*8-256], 10 vgetmantps xmm2{k5}{z}, xmm0, 10 vgetmantps xmm2{k5}{z}, [rbx], 10 vgetmantps xmm2{k5}{z}, [rbx]{1to4}, 10 vgetmantps xmm2{k5}{z}, [rbx+r11*8+256], 10 vgetmantps xmm2{k5}{z}, [rbx+r11*8-256], 10 vgetmantps ymm16, ymm15, 10 vgetmantps ymm16, [rbx], 10 vgetmantps ymm16, [rbx]{1to8}, 10 vgetmantps ymm16, [rbx+r11*8+256], 10 vgetmantps ymm16, [rbx+r11*8-256], 10 vgetmantps ymm16{k5}, ymm15, 10 vgetmantps ymm16{k5}, [rbx], 10 vgetmantps ymm16{k5}, [rbx]{1to8}, 10 vgetmantps ymm16{k5}, [rbx+r11*8+256], 10 vgetmantps ymm16{k5}, [rbx+r11*8-256], 10 vgetmantps ymm16{k5}{z}, ymm15, 10 vgetmantps ymm16{k5}{z}, [rbx], 10 vgetmantps ymm16{k5}{z}, [rbx]{1to8}, 10 vgetmantps ymm16{k5}{z}, [rbx+r11*8+256], 10 vgetmantps ymm16{k5}{z}, [rbx+r11*8-256], 10 vgetmantps zmm24, zmm31, 10 vgetmantps zmm24, [rbx], 10 vgetmantps zmm24, [rbx]{1to16}, 10 vgetmantps zmm24, [rbx+r11*8+256], 10 vgetmantps zmm24, [rbx+r11*8-256], 10 vgetmantps zmm24{k5}, zmm31, 10 vgetmantps zmm24{k5}, [rbx], 10 vgetmantps zmm24{k5}, [rbx]{1to16}, 10 vgetmantps zmm24{k5}, [rbx+r11*8+256], 10 vgetmantps zmm24{k5}, [rbx+r11*8-256], 10 vgetmantps zmm24{k5}{z}, zmm31, 10 vgetmantps zmm24{k5}{z}, [rbx], 10 vgetmantps zmm24{k5}{z}, [rbx]{1to16}, 10 vgetmantps zmm24{k5}{z}, [rbx+r11*8+256], 10 vgetmantps zmm24{k5}{z}, [rbx+r11*8-256], 10 vgetmantsd xmm2, xmm7, xmm0, 10 vgetmantsd xmm2, xmm7, [rbx], 10 vgetmantsd xmm2, xmm7, [rbx+r11*8+256], 10 vgetmantsd xmm2, xmm7, [rbx+r11*8-256], 10 vgetmantsd xmm2{k5}, xmm7, xmm0, 10 vgetmantsd xmm2{k5}, xmm7, [rbx], 10 vgetmantsd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vgetmantsd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vgetmantsd xmm2{k5}{z}, xmm7, xmm0, 10 vgetmantsd xmm2{k5}{z}, xmm7, [rbx], 10 vgetmantsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vgetmantsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vgetmantss xmm2, xmm7, xmm0, 10 vgetmantss xmm2, xmm7, [rbx], 10 vgetmantss xmm2, xmm7, [rbx+r11*8+256], 10 vgetmantss xmm2, xmm7, [rbx+r11*8-256], 10 vgetmantss xmm2{k5}, xmm7, xmm0, 10 vgetmantss xmm2{k5}, xmm7, [rbx], 10 vgetmantss xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vgetmantss xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vgetmantss xmm2{k5}{z}, xmm7, xmm0, 10 vgetmantss xmm2{k5}{z}, xmm7, [rbx], 10 vgetmantss xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vgetmantss xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vinsertf32x4 ymm16, ymm13, xmm0, 10 vinsertf32x4 ymm16, ymm13, [rbx], 10 vinsertf32x4 ymm16, ymm13, [rbx+r11*8+256], 10 vinsertf32x4 ymm16, ymm13, [rbx+r11*8-256], 10 vinsertf32x4 ymm16{k5}, ymm13, xmm0, 10 vinsertf32x4 ymm16{k5}, ymm13, [rbx], 10 vinsertf32x4 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vinsertf32x4 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vinsertf32x4 ymm16{k5}{z}, ymm13, xmm0, 10 vinsertf32x4 ymm16{k5}{z}, ymm13, [rbx], 10 vinsertf32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vinsertf32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vinsertf32x4 zmm24, zmm24, xmm0, 10 vinsertf32x4 zmm24, zmm24, [rbx], 10 vinsertf32x4 zmm24, zmm24, [rbx+r11*8+256], 10 vinsertf32x4 zmm24, zmm24, [rbx+r11*8-256], 10 vinsertf32x4 zmm24{k5}, zmm24, xmm0, 10 vinsertf32x4 zmm24{k5}, zmm24, [rbx], 10 vinsertf32x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vinsertf32x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vinsertf32x4 zmm24{k5}{z}, zmm24, xmm0, 10 vinsertf32x4 zmm24{k5}{z}, zmm24, [rbx], 10 vinsertf32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vinsertf32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vinsertf64x4 zmm24, zmm24, ymm15, 10 vinsertf64x4 zmm24, zmm24, [rbx], 10 vinsertf64x4 zmm24, zmm24, [rbx+r11*8+256], 10 vinsertf64x4 zmm24, zmm24, [rbx+r11*8-256], 10 vinsertf64x4 zmm24{k5}, zmm24, ymm15, 10 vinsertf64x4 zmm24{k5}, zmm24, [rbx], 10 vinsertf64x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vinsertf64x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vinsertf64x4 zmm24{k5}{z}, zmm24, ymm15, 10 vinsertf64x4 zmm24{k5}{z}, zmm24, [rbx], 10 vinsertf64x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vinsertf64x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vinserti32x4 ymm16, ymm13, xmm0, 10 vinserti32x4 ymm16, ymm13, [rbx], 10 vinserti32x4 ymm16, ymm13, [rbx+r11*8+256], 10 vinserti32x4 ymm16, ymm13, [rbx+r11*8-256], 10 vinserti32x4 ymm16{k5}, ymm13, xmm0, 10 vinserti32x4 ymm16{k5}, ymm13, [rbx], 10 vinserti32x4 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vinserti32x4 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vinserti32x4 ymm16{k5}{z}, ymm13, xmm0, 10 vinserti32x4 ymm16{k5}{z}, ymm13, [rbx], 10 vinserti32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vinserti32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vinserti32x4 zmm24, zmm24, xmm0, 10 vinserti32x4 zmm24, zmm24, [rbx], 10 vinserti32x4 zmm24, zmm24, [rbx+r11*8+256], 10 vinserti32x4 zmm24, zmm24, [rbx+r11*8-256], 10 vinserti32x4 zmm24{k5}, zmm24, xmm0, 10 vinserti32x4 zmm24{k5}, zmm24, [rbx], 10 vinserti32x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vinserti32x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vinserti32x4 zmm24{k5}{z}, zmm24, xmm0, 10 vinserti32x4 zmm24{k5}{z}, zmm24, [rbx], 10 vinserti32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vinserti32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vinserti64x4 zmm24, zmm24, ymm15, 10 vinserti64x4 zmm24, zmm24, [rbx], 10 vinserti64x4 zmm24, zmm24, [rbx+r11*8+256], 10 vinserti64x4 zmm24, zmm24, [rbx+r11*8-256], 10 vinserti64x4 zmm24{k5}, zmm24, ymm15, 10 vinserti64x4 zmm24{k5}, zmm24, [rbx], 10 vinserti64x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vinserti64x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vinserti64x4 zmm24{k5}{z}, zmm24, ymm15, 10 vinserti64x4 zmm24{k5}{z}, zmm24, [rbx], 10 vinserti64x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vinserti64x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vinsertps xmm2, xmm7, [rbx], 10 vinsertps xmm2, xmm7, [rbx+rsi*8+256], 10 vinsertps xmm2, xmm7, [rbx+rsi*8-256], 10 vinsertps xmm2, xmm7, xmm0, 10 vmaxpd xmm2, xmm7, xmm0 vmaxpd xmm2, xmm7, [rbx] vmaxpd xmm2, xmm7, [rbx]{1to2} vmaxpd xmm2, xmm7, [rbx+r11*8+256] vmaxpd xmm2, xmm7, [rbx+r11*8-256] vmaxpd xmm2{k5}, xmm7, xmm0 vmaxpd xmm2{k5}, xmm7, [rbx] vmaxpd xmm2{k5}, xmm7, [rbx]{1to2} vmaxpd xmm2{k5}, xmm7, [rbx+r11*8+256] vmaxpd xmm2{k5}, xmm7, [rbx+r11*8-256] vmaxpd xmm2{k5}{z}, xmm7, xmm0 vmaxpd xmm2{k5}{z}, xmm7, [rbx] vmaxpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vmaxpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmaxpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmaxpd ymm16, ymm13, ymm15 vmaxpd ymm16, ymm13, [rbx] vmaxpd ymm16, ymm13, [rbx]{1to4} vmaxpd ymm16, ymm13, [rbx+r11*8+256] vmaxpd ymm16, ymm13, [rbx+r11*8-256] vmaxpd ymm16{k5}, ymm13, ymm15 vmaxpd ymm16{k5}, ymm13, [rbx] vmaxpd ymm16{k5}, ymm13, [rbx]{1to4} vmaxpd ymm16{k5}, ymm13, [rbx+r11*8+256] vmaxpd ymm16{k5}, ymm13, [rbx+r11*8-256] vmaxpd ymm16{k5}{z}, ymm13, ymm15 vmaxpd ymm16{k5}{z}, ymm13, [rbx] vmaxpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vmaxpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vmaxpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vmaxpd zmm24, zmm24, zmm31 vmaxpd zmm24, zmm24, zmm31, {sae} vmaxpd zmm24, zmm24, [rbx] vmaxpd zmm24, zmm24, [rbx]{1to8} vmaxpd zmm24, zmm24, [rbx+r11*8+256] vmaxpd zmm24, zmm24, [rbx+r11*8-256] vmaxpd zmm24{k5}, zmm24, zmm31 vmaxpd zmm24{k5}, zmm24, zmm31, {sae} vmaxpd zmm24{k5}, zmm24, [rbx] vmaxpd zmm24{k5}, zmm24, [rbx]{1to8} vmaxpd zmm24{k5}, zmm24, [rbx+r11*8+256] vmaxpd zmm24{k5}, zmm24, [rbx+r11*8-256] vmaxpd zmm24{k5}{z}, zmm24, zmm31 vmaxpd zmm24{k5}{z}, zmm24, zmm31, {sae} vmaxpd zmm24{k5}{z}, zmm24, [rbx] vmaxpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vmaxpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vmaxpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vmaxps xmm2, xmm7, xmm0 vmaxps xmm2, xmm7, [rbx] vmaxps xmm2, xmm7, [rbx]{1to4} vmaxps xmm2, xmm7, [rbx+r11*8+256] vmaxps xmm2, xmm7, [rbx+r11*8-256] vmaxps xmm2{k5}, xmm7, xmm0 vmaxps xmm2{k5}, xmm7, [rbx] vmaxps xmm2{k5}, xmm7, [rbx]{1to4} vmaxps xmm2{k5}, xmm7, [rbx+r11*8+256] vmaxps xmm2{k5}, xmm7, [rbx+r11*8-256] vmaxps xmm2{k5}{z}, xmm7, xmm0 vmaxps xmm2{k5}{z}, xmm7, [rbx] vmaxps xmm2{k5}{z}, xmm7, [rbx]{1to4} vmaxps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmaxps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmaxps ymm16, ymm13, ymm15 vmaxps ymm16, ymm13, [rbx] vmaxps ymm16, ymm13, [rbx]{1to8} vmaxps ymm16, ymm13, [rbx+r11*8+256] vmaxps ymm16, ymm13, [rbx+r11*8-256] vmaxps ymm16{k5}, ymm13, ymm15 vmaxps ymm16{k5}, ymm13, [rbx] vmaxps ymm16{k5}, ymm13, [rbx]{1to8} vmaxps ymm16{k5}, ymm13, [rbx+r11*8+256] vmaxps ymm16{k5}, ymm13, [rbx+r11*8-256] vmaxps ymm16{k5}{z}, ymm13, ymm15 vmaxps ymm16{k5}{z}, ymm13, [rbx] vmaxps ymm16{k5}{z}, ymm13, [rbx]{1to8} vmaxps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vmaxps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vmaxps zmm24, zmm24, zmm31 vmaxps zmm24, zmm24, zmm31, {sae} vmaxps zmm24, zmm24, [rbx] vmaxps zmm24, zmm24, [rbx]{1to16} vmaxps zmm24, zmm24, [rbx+r11*8+256] vmaxps zmm24, zmm24, [rbx+r11*8-256] vmaxps zmm24{k5}, zmm24, zmm31 vmaxps zmm24{k5}, zmm24, zmm31, {sae} vmaxps zmm24{k5}, zmm24, [rbx] vmaxps zmm24{k5}, zmm24, [rbx]{1to16} vmaxps zmm24{k5}, zmm24, [rbx+r11*8+256] vmaxps zmm24{k5}, zmm24, [rbx+r11*8-256] vmaxps zmm24{k5}{z}, zmm24, zmm31 vmaxps zmm24{k5}{z}, zmm24, zmm31, {sae} vmaxps zmm24{k5}{z}, zmm24, [rbx] vmaxps zmm24{k5}{z}, zmm24, [rbx]{1to16} vmaxps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vmaxps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vmaxsd xmm2, xmm7, xmm0 vmaxsd xmm2, xmm7, xmm0, {sae} vmaxsd xmm2, xmm7, [rbx] vmaxsd xmm2, xmm7, [rbx+r11*8+256] vmaxsd xmm2, xmm7, [rbx+r11*8-256] vmaxsd xmm2{k5}, xmm7, xmm0 vmaxsd xmm2{k5}, xmm7, xmm0, {sae} vmaxsd xmm2{k5}, xmm7, [rbx] vmaxsd xmm2{k5}, xmm7, [rbx+r11*8+256] vmaxsd xmm2{k5}, xmm7, [rbx+r11*8-256] vmaxsd xmm2{k5}{z}, xmm7, xmm0 vmaxsd xmm2{k5}{z}, xmm7, xmm0, {sae} vmaxsd xmm2{k5}{z}, xmm7, [rbx] vmaxsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmaxsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmaxss xmm2, xmm7, xmm0 vmaxss xmm2, xmm7, xmm0, {sae} vmaxss xmm2, xmm7, [rbx] vmaxss xmm2, xmm7, [rbx+r11*8+256] vmaxss xmm2, xmm7, [rbx+r11*8-256] vmaxss xmm2{k5}, xmm7, xmm0 vmaxss xmm2{k5}, xmm7, xmm0, {sae} vmaxss xmm2{k5}, xmm7, [rbx] vmaxss xmm2{k5}, xmm7, [rbx+r11*8+256] vmaxss xmm2{k5}, xmm7, [rbx+r11*8-256] vmaxss xmm2{k5}{z}, xmm7, xmm0 vmaxss xmm2{k5}{z}, xmm7, xmm0, {sae} vmaxss xmm2{k5}{z}, xmm7, [rbx] vmaxss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmaxss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vminpd xmm2, xmm7, xmm0 vminpd xmm2, xmm7, [rbx] vminpd xmm2, xmm7, [rbx]{1to2} vminpd xmm2, xmm7, [rbx+r11*8+256] vminpd xmm2, xmm7, [rbx+r11*8-256] vminpd xmm2{k5}, xmm7, xmm0 vminpd xmm2{k5}, xmm7, [rbx] vminpd xmm2{k5}, xmm7, [rbx]{1to2} vminpd xmm2{k5}, xmm7, [rbx+r11*8+256] vminpd xmm2{k5}, xmm7, [rbx+r11*8-256] vminpd xmm2{k5}{z}, xmm7, xmm0 vminpd xmm2{k5}{z}, xmm7, [rbx] vminpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vminpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vminpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vminpd ymm16, ymm13, ymm15 vminpd ymm16, ymm13, [rbx] vminpd ymm16, ymm13, [rbx]{1to4} vminpd ymm16, ymm13, [rbx+r11*8+256] vminpd ymm16, ymm13, [rbx+r11*8-256] vminpd ymm16{k5}, ymm13, ymm15 vminpd ymm16{k5}, ymm13, [rbx] vminpd ymm16{k5}, ymm13, [rbx]{1to4} vminpd ymm16{k5}, ymm13, [rbx+r11*8+256] vminpd ymm16{k5}, ymm13, [rbx+r11*8-256] vminpd ymm16{k5}{z}, ymm13, ymm15 vminpd ymm16{k5}{z}, ymm13, [rbx] vminpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vminpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vminpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vminpd zmm24, zmm24, zmm31 vminpd zmm24, zmm24, zmm31, {sae} vminpd zmm24, zmm24, [rbx] vminpd zmm24, zmm24, [rbx]{1to8} vminpd zmm24, zmm24, [rbx+r11*8+256] vminpd zmm24, zmm24, [rbx+r11*8-256] vminpd zmm24{k5}, zmm24, zmm31 vminpd zmm24{k5}, zmm24, zmm31, {sae} vminpd zmm24{k5}, zmm24, [rbx] vminpd zmm24{k5}, zmm24, [rbx]{1to8} vminpd zmm24{k5}, zmm24, [rbx+r11*8+256] vminpd zmm24{k5}, zmm24, [rbx+r11*8-256] vminpd zmm24{k5}{z}, zmm24, zmm31 vminpd zmm24{k5}{z}, zmm24, zmm31, {sae} vminpd zmm24{k5}{z}, zmm24, [rbx] vminpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vminpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vminpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vminps xmm2, xmm7, xmm0 vminps xmm2, xmm7, [rbx] vminps xmm2, xmm7, [rbx]{1to4} vminps xmm2, xmm7, [rbx+r11*8+256] vminps xmm2, xmm7, [rbx+r11*8-256] vminps xmm2{k5}, xmm7, xmm0 vminps xmm2{k5}, xmm7, [rbx] vminps xmm2{k5}, xmm7, [rbx]{1to4} vminps xmm2{k5}, xmm7, [rbx+r11*8+256] vminps xmm2{k5}, xmm7, [rbx+r11*8-256] vminps xmm2{k5}{z}, xmm7, xmm0 vminps xmm2{k5}{z}, xmm7, [rbx] vminps xmm2{k5}{z}, xmm7, [rbx]{1to4} vminps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vminps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vminps ymm16, ymm13, ymm15 vminps ymm16, ymm13, [rbx] vminps ymm16, ymm13, [rbx]{1to8} vminps ymm16, ymm13, [rbx+r11*8+256] vminps ymm16, ymm13, [rbx+r11*8-256] vminps ymm16{k5}, ymm13, ymm15 vminps ymm16{k5}, ymm13, [rbx] vminps ymm16{k5}, ymm13, [rbx]{1to8} vminps ymm16{k5}, ymm13, [rbx+r11*8+256] vminps ymm16{k5}, ymm13, [rbx+r11*8-256] vminps ymm16{k5}{z}, ymm13, ymm15 vminps ymm16{k5}{z}, ymm13, [rbx] vminps ymm16{k5}{z}, ymm13, [rbx]{1to8} vminps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vminps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vminps zmm24, zmm24, zmm31 vminps zmm24, zmm24, zmm31, {sae} vminps zmm24, zmm24, [rbx] vminps zmm24, zmm24, [rbx]{1to16} vminps zmm24, zmm24, [rbx+r11*8+256] vminps zmm24, zmm24, [rbx+r11*8-256] vminps zmm24{k5}, zmm24, zmm31 vminps zmm24{k5}, zmm24, zmm31, {sae} vminps zmm24{k5}, zmm24, [rbx] vminps zmm24{k5}, zmm24, [rbx]{1to16} vminps zmm24{k5}, zmm24, [rbx+r11*8+256] vminps zmm24{k5}, zmm24, [rbx+r11*8-256] vminps zmm24{k5}{z}, zmm24, zmm31 vminps zmm24{k5}{z}, zmm24, zmm31, {sae} vminps zmm24{k5}{z}, zmm24, [rbx] vminps zmm24{k5}{z}, zmm24, [rbx]{1to16} vminps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vminps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vminsd xmm2, xmm7, xmm0 vminsd xmm2, xmm7, xmm0, {sae} vminsd xmm2, xmm7, [rbx] vminsd xmm2, xmm7, [rbx+r11*8+256] vminsd xmm2, xmm7, [rbx+r11*8-256] vminsd xmm2{k5}, xmm7, xmm0 vminsd xmm2{k5}, xmm7, xmm0, {sae} vminsd xmm2{k5}, xmm7, [rbx] vminsd xmm2{k5}, xmm7, [rbx+r11*8+256] vminsd xmm2{k5}, xmm7, [rbx+r11*8-256] vminsd xmm2{k5}{z}, xmm7, xmm0 vminsd xmm2{k5}{z}, xmm7, xmm0, {sae} vminsd xmm2{k5}{z}, xmm7, [rbx] vminsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vminsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vminss xmm2, xmm7, xmm0 vminss xmm2, xmm7, xmm0, {sae} vminss xmm2, xmm7, [rbx] vminss xmm2, xmm7, [rbx+r11*8+256] vminss xmm2, xmm7, [rbx+r11*8-256] vminss xmm2{k5}, xmm7, xmm0 vminss xmm2{k5}, xmm7, xmm0, {sae} vminss xmm2{k5}, xmm7, [rbx] vminss xmm2{k5}, xmm7, [rbx+r11*8+256] vminss xmm2{k5}, xmm7, [rbx+r11*8-256] vminss xmm2{k5}{z}, xmm7, xmm0 vminss xmm2{k5}{z}, xmm7, xmm0, {sae} vminss xmm2{k5}{z}, xmm7, [rbx] vminss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vminss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmovapd xmm2, xmm0 vmovapd xmm2, [rbx] vmovapd xmm2, [rbx+r11*8+256] vmovapd xmm2, [rbx+r11*8-256] vmovapd xmm2{k5}, xmm0 vmovapd xmm2{k5}, [rbx] vmovapd xmm2{k5}, [rbx+r11*8+256] vmovapd xmm2{k5}, [rbx+r11*8-256] vmovapd xmm2{k5}{z}, xmm0 vmovapd xmm2{k5}{z}, [rbx] vmovapd xmm2{k5}{z}, [rbx+r11*8+256] vmovapd xmm2{k5}{z}, [rbx+r11*8-256] vmovapd ymm16, ymm15 vmovapd ymm16, [rbx] vmovapd ymm16, [rbx+r11*8+256] vmovapd ymm16, [rbx+r11*8-256] vmovapd ymm16{k5}, ymm15 vmovapd ymm16{k5}, [rbx] vmovapd ymm16{k5}, [rbx+r11*8+256] vmovapd ymm16{k5}, [rbx+r11*8-256] vmovapd ymm16{k5}{z}, ymm15 vmovapd ymm16{k5}{z}, [rbx] vmovapd ymm16{k5}{z}, [rbx+r11*8+256] vmovapd ymm16{k5}{z}, [rbx+r11*8-256] vmovapd zmm24, zmm31 vmovapd zmm24, [rbx] vmovapd zmm24, [rbx+r11*8+256] vmovapd zmm24, [rbx+r11*8-256] vmovapd zmm24{k5}, zmm31 vmovapd zmm24{k5}, [rbx] vmovapd zmm24{k5}, [rbx+r11*8+256] vmovapd zmm24{k5}, [rbx+r11*8-256] vmovapd zmm24{k5}{z}, zmm31 vmovapd zmm24{k5}{z}, [rbx] vmovapd zmm24{k5}{z}, [rbx+r11*8+256] vmovapd zmm24{k5}{z}, [rbx+r11*8-256] vmovapd xmm0, xmm2 vmovapd ymm15, ymm16 vmovapd zmm31, zmm24 vmovapd [rbx], xmm2 vmovapd [rbx], ymm16 vmovapd [rbx], zmm24 vmovapd [rbx+r11*8+256], xmm2 vmovapd [rbx+r11*8+256], ymm16 vmovapd [rbx+r11*8+256], zmm24 vmovapd [rbx+r11*8-256], xmm2 vmovapd [rbx+r11*8-256], ymm16 vmovapd [rbx+r11*8-256], zmm24 vmovaps xmm2, xmm0 vmovaps xmm2, [rbx] vmovaps xmm2, [rbx+r11*8+256] vmovaps xmm2, [rbx+r11*8-256] vmovaps xmm2{k5}, xmm0 vmovaps xmm2{k5}, [rbx] vmovaps xmm2{k5}, [rbx+r11*8+256] vmovaps xmm2{k5}, [rbx+r11*8-256] vmovaps xmm2{k5}{z}, xmm0 vmovaps xmm2{k5}{z}, [rbx] vmovaps xmm2{k5}{z}, [rbx+r11*8+256] vmovaps xmm2{k5}{z}, [rbx+r11*8-256] vmovaps ymm16, ymm15 vmovaps ymm16, [rbx] vmovaps ymm16, [rbx+r11*8+256] vmovaps ymm16, [rbx+r11*8-256] vmovaps ymm16{k5}, ymm15 vmovaps ymm16{k5}, [rbx] vmovaps ymm16{k5}, [rbx+r11*8+256] vmovaps ymm16{k5}, [rbx+r11*8-256] vmovaps ymm16{k5}{z}, ymm15 vmovaps ymm16{k5}{z}, [rbx] vmovaps ymm16{k5}{z}, [rbx+r11*8+256] vmovaps ymm16{k5}{z}, [rbx+r11*8-256] vmovaps zmm24, zmm31 vmovaps zmm24, [rbx] vmovaps zmm24, [rbx+r11*8+256] vmovaps zmm24, [rbx+r11*8-256] vmovaps zmm24{k5}, zmm31 vmovaps zmm24{k5}, [rbx] vmovaps zmm24{k5}, [rbx+r11*8+256] vmovaps zmm24{k5}, [rbx+r11*8-256] vmovaps zmm24{k5}{z}, zmm31 vmovaps zmm24{k5}{z}, [rbx] vmovaps zmm24{k5}{z}, [rbx+r11*8+256] vmovaps zmm24{k5}{z}, [rbx+r11*8-256] vmovaps xmm0, xmm2 vmovaps ymm15, ymm16 vmovaps zmm31, zmm24 vmovaps [rbx], xmm2 vmovaps [rbx], ymm16 vmovaps [rbx], zmm24 vmovaps [rbx+r11*8+256], xmm2 vmovaps [rbx+r11*8+256], ymm16 vmovaps [rbx+r11*8+256], zmm24 vmovaps [rbx+r11*8-256], xmm2 vmovaps [rbx+r11*8-256], ymm16 vmovaps [rbx+r11*8-256], zmm24 vmovd xmm2, ecx vmovd xmm2, [rbx] vmovd xmm2, [rbx+rsi*8+256] vmovd ecx, xmm2 vmovd [rbx], xmm2 vmovd [rbx+rsi*8+256], xmm2 vmovddup xmm2, xmm0 vmovddup xmm2, [rbx] vmovddup xmm2, [rbx+r11*8+256] vmovddup xmm2, [rbx+r11*8-256] vmovddup xmm2{k5}, xmm0 vmovddup xmm2{k5}, [rbx] vmovddup xmm2{k5}, [rbx+r11*8+256] vmovddup xmm2{k5}, [rbx+r11*8-256] vmovddup xmm2{k5}{z}, xmm0 vmovddup xmm2{k5}{z}, [rbx] vmovddup xmm2{k5}{z}, [rbx+r11*8+256] vmovddup xmm2{k5}{z}, [rbx+r11*8-256] vmovddup ymm16, ymm15 vmovddup ymm16, [rbx] vmovddup ymm16, [rbx+r11*8+256] vmovddup ymm16, [rbx+r11*8-256] vmovddup ymm16{k5}, ymm15 vmovddup ymm16{k5}, [rbx] vmovddup ymm16{k5}, [rbx+r11*8+256] vmovddup ymm16{k5}, [rbx+r11*8-256] vmovddup ymm16{k5}{z}, ymm15 vmovddup ymm16{k5}{z}, [rbx] vmovddup ymm16{k5}{z}, [rbx+r11*8+256] vmovddup ymm16{k5}{z}, [rbx+r11*8-256] vmovddup zmm24, zmm31 vmovddup zmm24, [rbx] vmovddup zmm24, [rbx+r11*8+256] vmovddup zmm24, [rbx+r11*8-256] vmovddup zmm24{k5}, zmm31 vmovddup zmm24{k5}, [rbx] vmovddup zmm24{k5}, [rbx+r11*8+256] vmovddup zmm24{k5}, [rbx+r11*8-256] vmovddup zmm24{k5}{z}, zmm31 vmovddup zmm24{k5}{z}, [rbx] vmovddup zmm24{k5}{z}, [rbx+r11*8+256] vmovddup zmm24{k5}{z}, [rbx+r11*8-256] vmovddup xmm2, xmm0 vmovddup xmm2, [rbx] vmovddup xmm2, [rbx+r11*8+256] vmovddup xmm2, [rbx+r11*8-256] vmovddup xmm2{k5}, xmm0 vmovddup xmm2{k5}, [rbx] vmovddup xmm2{k5}, [rbx+r11*8+256] vmovddup xmm2{k5}, [rbx+r11*8-256] vmovddup xmm2{k5}{z}, xmm0 vmovddup xmm2{k5}{z}, [rbx] vmovddup xmm2{k5}{z}, [rbx+r11*8+256] vmovddup xmm2{k5}{z}, [rbx+r11*8-256] vmovddup ymm16, ymm15 vmovddup ymm16, [rbx] vmovddup ymm16, [rbx+r11*8+256] vmovddup ymm16, [rbx+r11*8-256] vmovddup ymm16{k5}, ymm15 vmovddup ymm16{k5}, [rbx] vmovddup ymm16{k5}, [rbx+r11*8+256] vmovddup ymm16{k5}, [rbx+r11*8-256] vmovddup ymm16{k5}{z}, ymm15 vmovddup ymm16{k5}{z}, [rbx] vmovddup ymm16{k5}{z}, [rbx+r11*8+256] vmovddup ymm16{k5}{z}, [rbx+r11*8-256] vmovddup zmm24, zmm31 vmovddup zmm24, [rbx] vmovddup zmm24, [rbx+r11*8+256] vmovddup zmm24, [rbx+r11*8-256] vmovddup zmm24{k5}, zmm31 vmovddup zmm24{k5}, [rbx] vmovddup zmm24{k5}, [rbx+r11*8+256] vmovddup zmm24{k5}, [rbx+r11*8-256] vmovddup zmm24{k5}{z}, zmm31 vmovddup zmm24{k5}{z}, [rbx] vmovddup zmm24{k5}{z}, [rbx+r11*8+256] vmovddup zmm24{k5}{z}, [rbx+r11*8-256] vmovddup xmm2, xmm0 vmovddup xmm2, [rbx] vmovddup xmm2, [rbx+r11*8+256] vmovddup xmm2, [rbx+r11*8-256] vmovddup xmm2{k5}, xmm0 vmovddup xmm2{k5}, [rbx] vmovddup xmm2{k5}, [rbx+r11*8+256] vmovddup xmm2{k5}, [rbx+r11*8-256] vmovddup xmm2{k5}{z}, xmm0 vmovddup xmm2{k5}{z}, [rbx] vmovddup xmm2{k5}{z}, [rbx+r11*8+256] vmovddup xmm2{k5}{z}, [rbx+r11*8-256] vmovddup ymm16, ymm15 vmovddup ymm16, [rbx] vmovddup ymm16, [rbx+r11*8+256] vmovddup ymm16, [rbx+r11*8-256] vmovddup ymm16{k5}, ymm15 vmovddup ymm16{k5}, [rbx] vmovddup ymm16{k5}, [rbx+r11*8+256] vmovddup ymm16{k5}, [rbx+r11*8-256] vmovddup ymm16{k5}{z}, ymm15 vmovddup ymm16{k5}{z}, [rbx] vmovddup ymm16{k5}{z}, [rbx+r11*8+256] vmovddup ymm16{k5}{z}, [rbx+r11*8-256] vmovddup zmm24, zmm31 vmovddup zmm24, [rbx] vmovddup zmm24, [rbx+r11*8+256] vmovddup zmm24, [rbx+r11*8-256] vmovddup zmm24{k5}, zmm31 vmovddup zmm24{k5}, [rbx] vmovddup zmm24{k5}, [rbx+r11*8+256] vmovddup zmm24{k5}, [rbx+r11*8-256] vmovddup zmm24{k5}{z}, zmm31 vmovddup zmm24{k5}{z}, [rbx] vmovddup zmm24{k5}{z}, [rbx+r11*8+256] vmovddup zmm24{k5}{z}, [rbx+r11*8-256] vmovdqa32 xmm2, xmm0 vmovdqa32 xmm2, [rbx] vmovdqa32 xmm2, [rbx+r11*8+256] vmovdqa32 xmm2, [rbx+r11*8-256] vmovdqa32 xmm2{k5}, xmm0 vmovdqa32 xmm2{k5}, [rbx] vmovdqa32 xmm2{k5}, [rbx+r11*8+256] vmovdqa32 xmm2{k5}, [rbx+r11*8-256] vmovdqa32 xmm2{k5}{z}, xmm0 vmovdqa32 xmm2{k5}{z}, [rbx] vmovdqa32 xmm2{k5}{z}, [rbx+r11*8+256] vmovdqa32 xmm2{k5}{z}, [rbx+r11*8-256] vmovdqa32 ymm16, ymm15 vmovdqa32 ymm16, [rbx] vmovdqa32 ymm16, [rbx+r11*8+256] vmovdqa32 ymm16, [rbx+r11*8-256] vmovdqa32 ymm16{k5}, ymm15 vmovdqa32 ymm16{k5}, [rbx] vmovdqa32 ymm16{k5}, [rbx+r11*8+256] vmovdqa32 ymm16{k5}, [rbx+r11*8-256] vmovdqa32 ymm16{k5}{z}, ymm15 vmovdqa32 ymm16{k5}{z}, [rbx] vmovdqa32 ymm16{k5}{z}, [rbx+r11*8+256] vmovdqa32 ymm16{k5}{z}, [rbx+r11*8-256] vmovdqa32 zmm24, zmm31 vmovdqa32 zmm24, [rbx] vmovdqa32 zmm24, [rbx+r11*8+256] vmovdqa32 zmm24, [rbx+r11*8-256] vmovdqa32 zmm24{k5}, zmm31 vmovdqa32 zmm24{k5}, [rbx] vmovdqa32 zmm24{k5}, [rbx+r11*8+256] vmovdqa32 zmm24{k5}, [rbx+r11*8-256] vmovdqa32 zmm24{k5}{z}, zmm31 vmovdqa32 zmm24{k5}{z}, [rbx] vmovdqa32 zmm24{k5}{z}, [rbx+r11*8+256] vmovdqa32 zmm24{k5}{z}, [rbx+r11*8-256] vmovdqa32 xmm0, xmm2 vmovdqa32 ymm15, ymm16 vmovdqa32 zmm31, zmm24 vmovdqa32 [rbx], xmm2 vmovdqa32 [rbx], ymm16 vmovdqa32 [rbx], zmm24 vmovdqa32 [rbx+r11*8+256], xmm2 vmovdqa32 [rbx+r11*8+256], ymm16 vmovdqa32 [rbx+r11*8+256], zmm24 vmovdqa32 [rbx+r11*8-256], xmm2 vmovdqa32 [rbx+r11*8-256], ymm16 vmovdqa32 [rbx+r11*8-256], zmm24 vmovdqa64 xmm2, xmm0 vmovdqa64 xmm2, [rbx] vmovdqa64 xmm2, [rbx+r11*8+256] vmovdqa64 xmm2, [rbx+r11*8-256] vmovdqa64 xmm2{k5}, xmm0 vmovdqa64 xmm2{k5}, [rbx] vmovdqa64 xmm2{k5}, [rbx+r11*8+256] vmovdqa64 xmm2{k5}, [rbx+r11*8-256] vmovdqa64 xmm2{k5}{z}, xmm0 vmovdqa64 xmm2{k5}{z}, [rbx] vmovdqa64 xmm2{k5}{z}, [rbx+r11*8+256] vmovdqa64 xmm2{k5}{z}, [rbx+r11*8-256] vmovdqa64 ymm16, ymm15 vmovdqa64 ymm16, [rbx] vmovdqa64 ymm16, [rbx+r11*8+256] vmovdqa64 ymm16, [rbx+r11*8-256] vmovdqa64 ymm16{k5}, ymm15 vmovdqa64 ymm16{k5}, [rbx] vmovdqa64 ymm16{k5}, [rbx+r11*8+256] vmovdqa64 ymm16{k5}, [rbx+r11*8-256] vmovdqa64 ymm16{k5}{z}, ymm15 vmovdqa64 ymm16{k5}{z}, [rbx] vmovdqa64 ymm16{k5}{z}, [rbx+r11*8+256] vmovdqa64 ymm16{k5}{z}, [rbx+r11*8-256] vmovdqa64 zmm24, zmm31 vmovdqa64 zmm24, [rbx] vmovdqa64 zmm24, [rbx+r11*8+256] vmovdqa64 zmm24, [rbx+r11*8-256] vmovdqa64 zmm24{k5}, zmm31 vmovdqa64 zmm24{k5}, [rbx] vmovdqa64 zmm24{k5}, [rbx+r11*8+256] vmovdqa64 zmm24{k5}, [rbx+r11*8-256] vmovdqa64 zmm24{k5}{z}, zmm31 vmovdqa64 zmm24{k5}{z}, [rbx] vmovdqa64 zmm24{k5}{z}, [rbx+r11*8+256] vmovdqa64 zmm24{k5}{z}, [rbx+r11*8-256] vmovdqa64 xmm0, xmm2 vmovdqa64 ymm15, ymm16 vmovdqa64 zmm31, zmm24 vmovdqa64 [rbx], xmm2 vmovdqa64 [rbx], ymm16 vmovdqa64 [rbx], zmm24 vmovdqa64 [rbx+r11*8+256], xmm2 vmovdqa64 [rbx+r11*8+256], ymm16 vmovdqa64 [rbx+r11*8+256], zmm24 vmovdqa64 [rbx+r11*8-256], xmm2 vmovdqa64 [rbx+r11*8-256], ymm16 vmovdqa64 [rbx+r11*8-256], zmm24 vmovdqu32 xmm2, xmm0 vmovdqu32 xmm2, [rbx] vmovdqu32 xmm2, [rbx+r11*8+256] vmovdqu32 xmm2, [rbx+r11*8-256] vmovdqu32 xmm2{k5}, xmm0 vmovdqu32 xmm2{k5}, [rbx] vmovdqu32 xmm2{k5}, [rbx+r11*8+256] vmovdqu32 xmm2{k5}, [rbx+r11*8-256] vmovdqu32 xmm2{k5}{z}, xmm0 vmovdqu32 xmm2{k5}{z}, [rbx] vmovdqu32 xmm2{k5}{z}, [rbx+r11*8+256] vmovdqu32 xmm2{k5}{z}, [rbx+r11*8-256] vmovdqu32 ymm16, ymm15 vmovdqu32 ymm16, [rbx] vmovdqu32 ymm16, [rbx+r11*8+256] vmovdqu32 ymm16, [rbx+r11*8-256] vmovdqu32 ymm16{k5}, ymm15 vmovdqu32 ymm16{k5}, [rbx] vmovdqu32 ymm16{k5}, [rbx+r11*8+256] vmovdqu32 ymm16{k5}, [rbx+r11*8-256] vmovdqu32 ymm16{k5}{z}, ymm15 vmovdqu32 ymm16{k5}{z}, [rbx] vmovdqu32 ymm16{k5}{z}, [rbx+r11*8+256] vmovdqu32 ymm16{k5}{z}, [rbx+r11*8-256] vmovdqu32 zmm24, zmm31 vmovdqu32 zmm24, [rbx] vmovdqu32 zmm24, [rbx+r11*8+256] vmovdqu32 zmm24, [rbx+r11*8-256] vmovdqu32 zmm24{k5}, zmm31 vmovdqu32 zmm24{k5}, [rbx] vmovdqu32 zmm24{k5}, [rbx+r11*8+256] vmovdqu32 zmm24{k5}, [rbx+r11*8-256] vmovdqu32 zmm24{k5}{z}, zmm31 vmovdqu32 zmm24{k5}{z}, [rbx] vmovdqu32 zmm24{k5}{z}, [rbx+r11*8+256] vmovdqu32 zmm24{k5}{z}, [rbx+r11*8-256] vmovdqu32 xmm0, xmm2 vmovdqu32 ymm15, ymm16 vmovdqu32 zmm31, zmm24 vmovdqu32 [rbx], xmm2 vmovdqu32 [rbx], ymm16 vmovdqu32 [rbx], zmm24 vmovdqu32 [rbx+r11*8+256], xmm2 vmovdqu32 [rbx+r11*8+256], ymm16 vmovdqu32 [rbx+r11*8+256], zmm24 vmovdqu32 [rbx+r11*8-256], xmm2 vmovdqu32 [rbx+r11*8-256], ymm16 vmovdqu32 [rbx+r11*8-256], zmm24 vmovdqu64 xmm2, xmm0 vmovdqu64 xmm2, [rbx] vmovdqu64 xmm2, [rbx+r11*8+256] vmovdqu64 xmm2, [rbx+r11*8-256] vmovdqu64 xmm2{k5}, xmm0 vmovdqu64 xmm2{k5}, [rbx] vmovdqu64 xmm2{k5}, [rbx+r11*8+256] vmovdqu64 xmm2{k5}, [rbx+r11*8-256] vmovdqu64 xmm2{k5}{z}, xmm0 vmovdqu64 xmm2{k5}{z}, [rbx] vmovdqu64 xmm2{k5}{z}, [rbx+r11*8+256] vmovdqu64 xmm2{k5}{z}, [rbx+r11*8-256] vmovdqu64 ymm16, ymm15 vmovdqu64 ymm16, [rbx] vmovdqu64 ymm16, [rbx+r11*8+256] vmovdqu64 ymm16, [rbx+r11*8-256] vmovdqu64 ymm16{k5}, ymm15 vmovdqu64 ymm16{k5}, [rbx] vmovdqu64 ymm16{k5}, [rbx+r11*8+256] vmovdqu64 ymm16{k5}, [rbx+r11*8-256] vmovdqu64 ymm16{k5}{z}, ymm15 vmovdqu64 ymm16{k5}{z}, [rbx] vmovdqu64 ymm16{k5}{z}, [rbx+r11*8+256] vmovdqu64 ymm16{k5}{z}, [rbx+r11*8-256] vmovdqu64 zmm24, zmm31 vmovdqu64 zmm24, [rbx] vmovdqu64 zmm24, [rbx+r11*8+256] vmovdqu64 zmm24, [rbx+r11*8-256] vmovdqu64 zmm24{k5}, zmm31 vmovdqu64 zmm24{k5}, [rbx] vmovdqu64 zmm24{k5}, [rbx+r11*8+256] vmovdqu64 zmm24{k5}, [rbx+r11*8-256] vmovdqu64 zmm24{k5}{z}, zmm31 vmovdqu64 zmm24{k5}{z}, [rbx] vmovdqu64 zmm24{k5}{z}, [rbx+r11*8+256] vmovdqu64 zmm24{k5}{z}, [rbx+r11*8-256] vmovdqu64 xmm0, xmm2 vmovdqu64 ymm15, ymm16 vmovdqu64 zmm31, zmm24 vmovdqu64 [rbx], xmm2 vmovdqu64 [rbx], ymm16 vmovdqu64 [rbx], zmm24 vmovdqu64 [rbx+r11*8+256], xmm2 vmovdqu64 [rbx+r11*8+256], ymm16 vmovdqu64 [rbx+r11*8+256], zmm24 vmovdqu64 [rbx+r11*8-256], xmm2 vmovdqu64 [rbx+r11*8-256], ymm16 vmovdqu64 [rbx+r11*8-256], zmm24 vmovhlps xmm2, xmm7, xmm0 vmovhpd xmm2, xmm7, [rbx] vmovhpd xmm2, xmm7, [rbx+rsi*8+256] vmovhpd xmm2, xmm7, [rbx+rsi*8-256] vmovhpd [rbx], xmm2 vmovhpd [rbx+rsi*8+256], xmm2 vmovhpd [rbx+rsi*8-256], xmm2 vmovhps xmm2, xmm7, [rbx] vmovhps xmm2, xmm7, [rbx+rsi*8+256] vmovhps xmm2, xmm7, [rbx+rsi*8-256] vmovhps [rbx], xmm2 vmovhps [rbx+rsi*8+256], xmm2 vmovhps [rbx+rsi*8-256], xmm2 vmovlhps xmm2, xmm7, xmm0 vmovlpd xmm2, xmm7, [rbx] vmovlpd xmm2, xmm7, [rbx+rsi*8+256] vmovlpd xmm2, xmm7, [rbx+rsi*8-256] vmovlpd [rbx], xmm2 vmovlpd [rbx+rsi*8+256], xmm2 vmovlpd [rbx+rsi*8-256], xmm2 vmovlps xmm2, xmm7, [rbx] vmovlps xmm2, xmm7, [rbx+rsi*8+256] vmovlps xmm2, xmm7, [rbx+rsi*8-256] vmovlps [rbx], xmm2 vmovlps [rbx+rsi*8+256], xmm2 vmovlps [rbx+rsi*8-256], xmm2 vmovntdq [rbx], xmm2 vmovntdq [rbx], ymm16 vmovntdq [rbx], zmm24 vmovntdq [rbx+rsi*8+256], xmm2 vmovntdq [rbx+rsi*8+256], ymm16 vmovntdq [rbx+rsi*8+256], zmm24 vmovntdq [rbx+rsi*8-256], xmm2 vmovntdq [rbx+rsi*8-256], ymm16 vmovntdq [rbx+rsi*8-256], zmm24 vmovntdqa xmm2, [rbx] vmovntdqa xmm2, [rbx+rsi*8+256] vmovntdqa xmm2, [rbx+rsi*8-256] vmovntdqa ymm16, [rbx] vmovntdqa ymm16, [rbx+rsi*8+256] vmovntdqa ymm16, [rbx+rsi*8-256] vmovntdqa zmm24, [rbx] vmovntdqa zmm24, [rbx+rsi*8+256] vmovntdqa zmm24, [rbx+rsi*8-256] vmovntpd [rbx], xmm2 vmovntpd [rbx], ymm16 vmovntpd [rbx], zmm24 vmovntpd [rbx+rsi*8+256], xmm2 vmovntpd [rbx+rsi*8+256], ymm16 vmovntpd [rbx+rsi*8+256], zmm24 vmovntpd [rbx+rsi*8-256], xmm2 vmovntpd [rbx+rsi*8-256], ymm16 vmovntpd [rbx+rsi*8-256], zmm24 vmovntps [rbx], xmm2 vmovntps [rbx], ymm16 vmovntps [rbx], zmm24 vmovntps [rbx+rsi*8+256], xmm2 vmovntps [rbx+rsi*8+256], ymm16 vmovntps [rbx+rsi*8+256], zmm24 vmovntps [rbx+rsi*8-256], xmm2 vmovntps [rbx+rsi*8-256], ymm16 vmovntps [rbx+rsi*8-256], zmm24 vmovq xmm2, rcx vmovq xmm2, [rbx] vmovq xmm2, [rbx+rsi*8+256] vmovq rcx, xmm2 vmovq [rbx], xmm2 vmovq [rbx+rsi*8+256], xmm2 vmovq xmm2, xmm0 vmovq xmm2, [rbx] vmovq xmm2, [rbx+r11*8+256] vmovq xmm2, [rbx+r11*8-256] vmovq xmm0, xmm2 vmovq [rbx], xmm2 vmovq [rbx+r11*8+256], xmm2 vmovq [rbx+r11*8-256], xmm2 vmovsd xmm2, [rbx] vmovsd xmm2, [rbx+rsi*8+256] vmovsd xmm2, [rbx+rsi*8-256] vmovsd xmm2{k5}, [rbx] vmovsd xmm2{k5}, [rbx+rsi*8+256] vmovsd xmm2{k5}, [rbx+rsi*8-256] vmovsd xmm2{k5}{z}, [rbx] vmovsd xmm2{k5}{z}, [rbx+rsi*8+256] vmovsd xmm2{k5}{z}, [rbx+rsi*8-256] vmovsd xmm2, xmm7, xmm0 vmovsd xmm2{k5}, xmm7, xmm0 vmovsd xmm2{k5}{z}, xmm7, xmm0 vmovsd [rbx], xmm2 vmovsd [rbx+rsi*8+256], xmm2 vmovsd [rbx+rsi*8-256], xmm2 vmovsd xmm0, xmm7, xmm2 vmovshdup xmm2, xmm0 vmovshdup xmm2, [rbx] vmovshdup xmm2, [rbx+r11*8+256] vmovshdup xmm2, [rbx+r11*8-256] vmovshdup xmm2{k5}, xmm0 vmovshdup xmm2{k5}, [rbx] vmovshdup xmm2{k5}, [rbx+r11*8+256] vmovshdup xmm2{k5}, [rbx+r11*8-256] vmovshdup xmm2{k5}{z}, xmm0 vmovshdup xmm2{k5}{z}, [rbx] vmovshdup xmm2{k5}{z}, [rbx+r11*8+256] vmovshdup xmm2{k5}{z}, [rbx+r11*8-256] vmovshdup ymm16, ymm15 vmovshdup ymm16, [rbx] vmovshdup ymm16, [rbx+r11*8+256] vmovshdup ymm16, [rbx+r11*8-256] vmovshdup ymm16{k5}, ymm15 vmovshdup ymm16{k5}, [rbx] vmovshdup ymm16{k5}, [rbx+r11*8+256] vmovshdup ymm16{k5}, [rbx+r11*8-256] vmovshdup ymm16{k5}{z}, ymm15 vmovshdup ymm16{k5}{z}, [rbx] vmovshdup ymm16{k5}{z}, [rbx+r11*8+256] vmovshdup ymm16{k5}{z}, [rbx+r11*8-256] vmovshdup zmm24, zmm31 vmovshdup zmm24, [rbx] vmovshdup zmm24, [rbx+r11*8+256] vmovshdup zmm24, [rbx+r11*8-256] vmovshdup zmm24{k5}, zmm31 vmovshdup zmm24{k5}, [rbx] vmovshdup zmm24{k5}, [rbx+r11*8+256] vmovshdup zmm24{k5}, [rbx+r11*8-256] vmovshdup zmm24{k5}{z}, zmm31 vmovshdup zmm24{k5}{z}, [rbx] vmovshdup zmm24{k5}{z}, [rbx+r11*8+256] vmovshdup zmm24{k5}{z}, [rbx+r11*8-256] vmovsldup xmm2, xmm0 vmovsldup xmm2, [rbx] vmovsldup xmm2, [rbx+r11*8+256] vmovsldup xmm2, [rbx+r11*8-256] vmovsldup xmm2{k5}, xmm0 vmovsldup xmm2{k5}, [rbx] vmovsldup xmm2{k5}, [rbx+r11*8+256] vmovsldup xmm2{k5}, [rbx+r11*8-256] vmovsldup xmm2{k5}{z}, xmm0 vmovsldup xmm2{k5}{z}, [rbx] vmovsldup xmm2{k5}{z}, [rbx+r11*8+256] vmovsldup xmm2{k5}{z}, [rbx+r11*8-256] vmovsldup ymm16, ymm15 vmovsldup ymm16, [rbx] vmovsldup ymm16, [rbx+r11*8+256] vmovsldup ymm16, [rbx+r11*8-256] vmovsldup ymm16{k5}, ymm15 vmovsldup ymm16{k5}, [rbx] vmovsldup ymm16{k5}, [rbx+r11*8+256] vmovsldup ymm16{k5}, [rbx+r11*8-256] vmovsldup ymm16{k5}{z}, ymm15 vmovsldup ymm16{k5}{z}, [rbx] vmovsldup ymm16{k5}{z}, [rbx+r11*8+256] vmovsldup ymm16{k5}{z}, [rbx+r11*8-256] vmovsldup zmm24, zmm31 vmovsldup zmm24, [rbx] vmovsldup zmm24, [rbx+r11*8+256] vmovsldup zmm24, [rbx+r11*8-256] vmovsldup zmm24{k5}, zmm31 vmovsldup zmm24{k5}, [rbx] vmovsldup zmm24{k5}, [rbx+r11*8+256] vmovsldup zmm24{k5}, [rbx+r11*8-256] vmovsldup zmm24{k5}{z}, zmm31 vmovsldup zmm24{k5}{z}, [rbx] vmovsldup zmm24{k5}{z}, [rbx+r11*8+256] vmovsldup zmm24{k5}{z}, [rbx+r11*8-256] vmovss xmm2, [rbx] vmovss xmm2, [rbx+rsi*8+256] vmovss xmm2, [rbx+rsi*8-256] vmovss xmm2{k5}, [rbx] vmovss xmm2{k5}, [rbx+rsi*8+256] vmovss xmm2{k5}, [rbx+rsi*8-256] vmovss xmm2{k5}{z}, [rbx] vmovss xmm2{k5}{z}, [rbx+rsi*8+256] vmovss xmm2{k5}{z}, [rbx+rsi*8-256] vmovss xmm2, xmm7, xmm0 vmovss xmm2{k5}, xmm7, xmm0 vmovss xmm2{k5}{z}, xmm7, xmm0 vmovss [rbx], xmm2 vmovss [rbx+rsi*8+256], xmm2 vmovss [rbx+rsi*8-256], xmm2 vmovss xmm0, xmm7, xmm2 vmovupd xmm2, xmm0 vmovupd xmm2, [rbx] vmovupd xmm2, [rbx+r11*8+256] vmovupd xmm2, [rbx+r11*8-256] vmovupd xmm2{k5}, xmm0 vmovupd xmm2{k5}, [rbx] vmovupd xmm2{k5}, [rbx+r11*8+256] vmovupd xmm2{k5}, [rbx+r11*8-256] vmovupd xmm2{k5}{z}, xmm0 vmovupd xmm2{k5}{z}, [rbx] vmovupd xmm2{k5}{z}, [rbx+r11*8+256] vmovupd xmm2{k5}{z}, [rbx+r11*8-256] vmovupd ymm16, ymm15 vmovupd ymm16, [rbx] vmovupd ymm16, [rbx+r11*8+256] vmovupd ymm16, [rbx+r11*8-256] vmovupd ymm16{k5}, ymm15 vmovupd ymm16{k5}, [rbx] vmovupd ymm16{k5}, [rbx+r11*8+256] vmovupd ymm16{k5}, [rbx+r11*8-256] vmovupd ymm16{k5}{z}, ymm15 vmovupd ymm16{k5}{z}, [rbx] vmovupd ymm16{k5}{z}, [rbx+r11*8+256] vmovupd ymm16{k5}{z}, [rbx+r11*8-256] vmovupd zmm24, zmm31 vmovupd zmm24, [rbx] vmovupd zmm24, [rbx+r11*8+256] vmovupd zmm24, [rbx+r11*8-256] vmovupd zmm24{k5}, zmm31 vmovupd zmm24{k5}, [rbx] vmovupd zmm24{k5}, [rbx+r11*8+256] vmovupd zmm24{k5}, [rbx+r11*8-256] vmovupd zmm24{k5}{z}, zmm31 vmovupd zmm24{k5}{z}, [rbx] vmovupd zmm24{k5}{z}, [rbx+r11*8+256] vmovupd zmm24{k5}{z}, [rbx+r11*8-256] vmovupd xmm0, xmm2 vmovupd ymm15, ymm16 vmovupd zmm31, zmm24 vmovupd [rbx], xmm2 vmovupd [rbx], ymm16 vmovupd [rbx], zmm24 vmovupd [rbx+r11*8+256], xmm2 vmovupd [rbx+r11*8+256], ymm16 vmovupd [rbx+r11*8+256], zmm24 vmovupd [rbx+r11*8-256], xmm2 vmovupd [rbx+r11*8-256], ymm16 vmovupd [rbx+r11*8-256], zmm24 vmovups xmm2, xmm0 vmovups xmm2, [rbx] vmovups xmm2, [rbx+r11*8+256] vmovups xmm2, [rbx+r11*8-256] vmovups xmm2{k5}, xmm0 vmovups xmm2{k5}, [rbx] vmovups xmm2{k5}, [rbx+r11*8+256] vmovups xmm2{k5}, [rbx+r11*8-256] vmovups xmm2{k5}{z}, xmm0 vmovups xmm2{k5}{z}, [rbx] vmovups xmm2{k5}{z}, [rbx+r11*8+256] vmovups xmm2{k5}{z}, [rbx+r11*8-256] vmovups ymm16, ymm15 vmovups ymm16, [rbx] vmovups ymm16, [rbx+r11*8+256] vmovups ymm16, [rbx+r11*8-256] vmovups ymm16{k5}, ymm15 vmovups ymm16{k5}, [rbx] vmovups ymm16{k5}, [rbx+r11*8+256] vmovups ymm16{k5}, [rbx+r11*8-256] vmovups ymm16{k5}{z}, ymm15 vmovups ymm16{k5}{z}, [rbx] vmovups ymm16{k5}{z}, [rbx+r11*8+256] vmovups ymm16{k5}{z}, [rbx+r11*8-256] vmovups zmm24, zmm31 vmovups zmm24, [rbx] vmovups zmm24, [rbx+r11*8+256] vmovups zmm24, [rbx+r11*8-256] vmovups zmm24{k5}, zmm31 vmovups zmm24{k5}, [rbx] vmovups zmm24{k5}, [rbx+r11*8+256] vmovups zmm24{k5}, [rbx+r11*8-256] vmovups zmm24{k5}{z}, zmm31 vmovups zmm24{k5}{z}, [rbx] vmovups zmm24{k5}{z}, [rbx+r11*8+256] vmovups zmm24{k5}{z}, [rbx+r11*8-256] vmovups xmm0, xmm2 vmovups ymm15, ymm16 vmovups zmm31, zmm24 vmovups [rbx], xmm2 vmovups [rbx], ymm16 vmovups [rbx], zmm24 vmovups [rbx+r11*8+256], xmm2 vmovups [rbx+r11*8+256], ymm16 vmovups [rbx+r11*8+256], zmm24 vmovups [rbx+r11*8-256], xmm2 vmovups [rbx+r11*8-256], ymm16 vmovups [rbx+r11*8-256], zmm24 vmulpd xmm2, xmm7, xmm0 vmulpd xmm2, xmm7, [rbx] vmulpd xmm2, xmm7, [rbx]{1to2} vmulpd xmm2, xmm7, [rbx+r11*8+256] vmulpd xmm2, xmm7, [rbx+r11*8-256] vmulpd xmm2{k5}, xmm7, xmm0 vmulpd xmm2{k5}, xmm7, [rbx] vmulpd xmm2{k5}, xmm7, [rbx]{1to2} vmulpd xmm2{k5}, xmm7, [rbx+r11*8+256] vmulpd xmm2{k5}, xmm7, [rbx+r11*8-256] vmulpd xmm2{k5}{z}, xmm7, xmm0 vmulpd xmm2{k5}{z}, xmm7, [rbx] vmulpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vmulpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmulpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmulpd ymm16, ymm13, ymm15 vmulpd ymm16, ymm13, [rbx] vmulpd ymm16, ymm13, [rbx]{1to4} vmulpd ymm16, ymm13, [rbx+r11*8+256] vmulpd ymm16, ymm13, [rbx+r11*8-256] vmulpd ymm16{k5}, ymm13, ymm15 vmulpd ymm16{k5}, ymm13, [rbx] vmulpd ymm16{k5}, ymm13, [rbx]{1to4} vmulpd ymm16{k5}, ymm13, [rbx+r11*8+256] vmulpd ymm16{k5}, ymm13, [rbx+r11*8-256] vmulpd ymm16{k5}{z}, ymm13, ymm15 vmulpd ymm16{k5}{z}, ymm13, [rbx] vmulpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vmulpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vmulpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vmulpd zmm24, zmm24, zmm31 vmulpd zmm24, zmm24, zmm31, {rd-sae} vmulpd zmm24, zmm24, [rbx] vmulpd zmm24, zmm24, [rbx]{1to8} vmulpd zmm24, zmm24, [rbx+r11*8+256] vmulpd zmm24, zmm24, [rbx+r11*8-256] vmulpd zmm24{k5}, zmm24, zmm31 vmulpd zmm24{k5}, zmm24, zmm31, {rd-sae} vmulpd zmm24{k5}, zmm24, [rbx] vmulpd zmm24{k5}, zmm24, [rbx]{1to8} vmulpd zmm24{k5}, zmm24, [rbx+r11*8+256] vmulpd zmm24{k5}, zmm24, [rbx+r11*8-256] vmulpd zmm24{k5}{z}, zmm24, zmm31 vmulpd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vmulpd zmm24{k5}{z}, zmm24, [rbx] vmulpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vmulpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vmulpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vmulps xmm2, xmm7, xmm0 vmulps xmm2, xmm7, [rbx] vmulps xmm2, xmm7, [rbx]{1to4} vmulps xmm2, xmm7, [rbx+r11*8+256] vmulps xmm2, xmm7, [rbx+r11*8-256] vmulps xmm2{k5}, xmm7, xmm0 vmulps xmm2{k5}, xmm7, [rbx] vmulps xmm2{k5}, xmm7, [rbx]{1to4} vmulps xmm2{k5}, xmm7, [rbx+r11*8+256] vmulps xmm2{k5}, xmm7, [rbx+r11*8-256] vmulps xmm2{k5}{z}, xmm7, xmm0 vmulps xmm2{k5}{z}, xmm7, [rbx] vmulps xmm2{k5}{z}, xmm7, [rbx]{1to4} vmulps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmulps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmulps ymm16, ymm13, ymm15 vmulps ymm16, ymm13, [rbx] vmulps ymm16, ymm13, [rbx]{1to8} vmulps ymm16, ymm13, [rbx+r11*8+256] vmulps ymm16, ymm13, [rbx+r11*8-256] vmulps ymm16{k5}, ymm13, ymm15 vmulps ymm16{k5}, ymm13, [rbx] vmulps ymm16{k5}, ymm13, [rbx]{1to8} vmulps ymm16{k5}, ymm13, [rbx+r11*8+256] vmulps ymm16{k5}, ymm13, [rbx+r11*8-256] vmulps ymm16{k5}{z}, ymm13, ymm15 vmulps ymm16{k5}{z}, ymm13, [rbx] vmulps ymm16{k5}{z}, ymm13, [rbx]{1to8} vmulps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vmulps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vmulps zmm24, zmm24, zmm31 vmulps zmm24, zmm24, zmm31, {rd-sae} vmulps zmm24, zmm24, [rbx] vmulps zmm24, zmm24, [rbx]{1to16} vmulps zmm24, zmm24, [rbx+r11*8+256] vmulps zmm24, zmm24, [rbx+r11*8-256] vmulps zmm24{k5}, zmm24, zmm31 vmulps zmm24{k5}, zmm24, zmm31, {rd-sae} vmulps zmm24{k5}, zmm24, [rbx] vmulps zmm24{k5}, zmm24, [rbx]{1to16} vmulps zmm24{k5}, zmm24, [rbx+r11*8+256] vmulps zmm24{k5}, zmm24, [rbx+r11*8-256] vmulps zmm24{k5}{z}, zmm24, zmm31 vmulps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vmulps zmm24{k5}{z}, zmm24, [rbx] vmulps zmm24{k5}{z}, zmm24, [rbx]{1to16} vmulps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vmulps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vmulsd xmm2, xmm7, xmm0 vmulsd xmm2, xmm7, xmm0, {rd-sae} vmulsd xmm2, xmm7, [rbx] vmulsd xmm2, xmm7, [rbx+r11*8+256] vmulsd xmm2, xmm7, [rbx+r11*8-256] vmulsd xmm2{k5}, xmm7, xmm0 vmulsd xmm2{k5}, xmm7, xmm0, {rd-sae} vmulsd xmm2{k5}, xmm7, [rbx] vmulsd xmm2{k5}, xmm7, [rbx+r11*8+256] vmulsd xmm2{k5}, xmm7, [rbx+r11*8-256] vmulsd xmm2{k5}{z}, xmm7, xmm0 vmulsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vmulsd xmm2{k5}{z}, xmm7, [rbx] vmulsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmulsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vmulss xmm2, xmm7, xmm0 vmulss xmm2, xmm7, xmm0, {rd-sae} vmulss xmm2, xmm7, [rbx] vmulss xmm2, xmm7, [rbx+r11*8+256] vmulss xmm2, xmm7, [rbx+r11*8-256] vmulss xmm2{k5}, xmm7, xmm0 vmulss xmm2{k5}, xmm7, xmm0, {rd-sae} vmulss xmm2{k5}, xmm7, [rbx] vmulss xmm2{k5}, xmm7, [rbx+r11*8+256] vmulss xmm2{k5}, xmm7, [rbx+r11*8-256] vmulss xmm2{k5}{z}, xmm7, xmm0 vmulss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vmulss xmm2{k5}{z}, xmm7, [rbx] vmulss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vmulss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpabsd xmm2, xmm0 vpabsd xmm2, [rbx] vpabsd xmm2, [rbx]{1to4} vpabsd xmm2, [rbx+r11*8+256] vpabsd xmm2, [rbx+r11*8-256] vpabsd xmm2{k5}, xmm0 vpabsd xmm2{k5}, [rbx] vpabsd xmm2{k5}, [rbx]{1to4} vpabsd xmm2{k5}, [rbx+r11*8+256] vpabsd xmm2{k5}, [rbx+r11*8-256] vpabsd xmm2{k5}{z}, xmm0 vpabsd xmm2{k5}{z}, [rbx] vpabsd xmm2{k5}{z}, [rbx]{1to4} vpabsd xmm2{k5}{z}, [rbx+r11*8+256] vpabsd xmm2{k5}{z}, [rbx+r11*8-256] vpabsd ymm16, ymm15 vpabsd ymm16, [rbx] vpabsd ymm16, [rbx]{1to8} vpabsd ymm16, [rbx+r11*8+256] vpabsd ymm16, [rbx+r11*8-256] vpabsd ymm16{k5}, ymm15 vpabsd ymm16{k5}, [rbx] vpabsd ymm16{k5}, [rbx]{1to8} vpabsd ymm16{k5}, [rbx+r11*8+256] vpabsd ymm16{k5}, [rbx+r11*8-256] vpabsd ymm16{k5}{z}, ymm15 vpabsd ymm16{k5}{z}, [rbx] vpabsd ymm16{k5}{z}, [rbx]{1to8} vpabsd ymm16{k5}{z}, [rbx+r11*8+256] vpabsd ymm16{k5}{z}, [rbx+r11*8-256] vpabsd zmm24, zmm31 vpabsd zmm24, [rbx] vpabsd zmm24, [rbx]{1to16} vpabsd zmm24, [rbx+r11*8+256] vpabsd zmm24, [rbx+r11*8-256] vpabsd zmm24{k5}, zmm31 vpabsd zmm24{k5}, [rbx] vpabsd zmm24{k5}, [rbx]{1to16} vpabsd zmm24{k5}, [rbx+r11*8+256] vpabsd zmm24{k5}, [rbx+r11*8-256] vpabsd zmm24{k5}{z}, zmm31 vpabsd zmm24{k5}{z}, [rbx] vpabsd zmm24{k5}{z}, [rbx]{1to16} vpabsd zmm24{k5}{z}, [rbx+r11*8+256] vpabsd zmm24{k5}{z}, [rbx+r11*8-256] vpabsq xmm2, xmm0 vpabsq xmm2, [rbx] vpabsq xmm2, [rbx]{1to2} vpabsq xmm2, [rbx+r11*8+256] vpabsq xmm2, [rbx+r11*8-256] vpabsq xmm2{k5}, xmm0 vpabsq xmm2{k5}, [rbx] vpabsq xmm2{k5}, [rbx]{1to2} vpabsq xmm2{k5}, [rbx+r11*8+256] vpabsq xmm2{k5}, [rbx+r11*8-256] vpabsq xmm2{k5}{z}, xmm0 vpabsq xmm2{k5}{z}, [rbx] vpabsq xmm2{k5}{z}, [rbx]{1to2} vpabsq xmm2{k5}{z}, [rbx+r11*8+256] vpabsq xmm2{k5}{z}, [rbx+r11*8-256] vpabsq ymm16, ymm15 vpabsq ymm16, [rbx] vpabsq ymm16, [rbx]{1to4} vpabsq ymm16, [rbx+r11*8+256] vpabsq ymm16, [rbx+r11*8-256] vpabsq ymm16{k5}, ymm15 vpabsq ymm16{k5}, [rbx] vpabsq ymm16{k5}, [rbx]{1to4} vpabsq ymm16{k5}, [rbx+r11*8+256] vpabsq ymm16{k5}, [rbx+r11*8-256] vpabsq ymm16{k5}{z}, ymm15 vpabsq ymm16{k5}{z}, [rbx] vpabsq ymm16{k5}{z}, [rbx]{1to4} vpabsq ymm16{k5}{z}, [rbx+r11*8+256] vpabsq ymm16{k5}{z}, [rbx+r11*8-256] vpabsq zmm24, zmm31 vpabsq zmm24, [rbx] vpabsq zmm24, [rbx]{1to8} vpabsq zmm24, [rbx+r11*8+256] vpabsq zmm24, [rbx+r11*8-256] vpabsq zmm24{k5}, zmm31 vpabsq zmm24{k5}, [rbx] vpabsq zmm24{k5}, [rbx]{1to8} vpabsq zmm24{k5}, [rbx+r11*8+256] vpabsq zmm24{k5}, [rbx+r11*8-256] vpabsq zmm24{k5}{z}, zmm31 vpabsq zmm24{k5}{z}, [rbx] vpabsq zmm24{k5}{z}, [rbx]{1to8} vpabsq zmm24{k5}{z}, [rbx+r11*8+256] vpabsq zmm24{k5}{z}, [rbx+r11*8-256] vpaddd xmm2, xmm7, xmm0 vpaddd xmm2, xmm7, [rbx] vpaddd xmm2, xmm7, [rbx]{1to4} vpaddd xmm2, xmm7, [rbx+r11*8+256] vpaddd xmm2, xmm7, [rbx+r11*8-256] vpaddd xmm2{k5}, xmm7, xmm0 vpaddd xmm2{k5}, xmm7, [rbx] vpaddd xmm2{k5}, xmm7, [rbx]{1to4} vpaddd xmm2{k5}, xmm7, [rbx+r11*8+256] vpaddd xmm2{k5}, xmm7, [rbx+r11*8-256] vpaddd xmm2{k5}{z}, xmm7, xmm0 vpaddd xmm2{k5}{z}, xmm7, [rbx] vpaddd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpaddd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpaddd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpaddd ymm16, ymm13, ymm15 vpaddd ymm16, ymm13, [rbx] vpaddd ymm16, ymm13, [rbx]{1to8} vpaddd ymm16, ymm13, [rbx+r11*8+256] vpaddd ymm16, ymm13, [rbx+r11*8-256] vpaddd ymm16{k5}, ymm13, ymm15 vpaddd ymm16{k5}, ymm13, [rbx] vpaddd ymm16{k5}, ymm13, [rbx]{1to8} vpaddd ymm16{k5}, ymm13, [rbx+r11*8+256] vpaddd ymm16{k5}, ymm13, [rbx+r11*8-256] vpaddd ymm16{k5}{z}, ymm13, ymm15 vpaddd ymm16{k5}{z}, ymm13, [rbx] vpaddd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpaddd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpaddd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpaddd zmm24, zmm24, zmm31 vpaddd zmm24, zmm24, [rbx] vpaddd zmm24, zmm24, [rbx]{1to16} vpaddd zmm24, zmm24, [rbx+r11*8+256] vpaddd zmm24, zmm24, [rbx+r11*8-256] vpaddd zmm24{k5}, zmm24, zmm31 vpaddd zmm24{k5}, zmm24, [rbx] vpaddd zmm24{k5}, zmm24, [rbx]{1to16} vpaddd zmm24{k5}, zmm24, [rbx+r11*8+256] vpaddd zmm24{k5}, zmm24, [rbx+r11*8-256] vpaddd zmm24{k5}{z}, zmm24, zmm31 vpaddd zmm24{k5}{z}, zmm24, [rbx] vpaddd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpaddd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpaddd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpaddq xmm2, xmm7, xmm0 vpaddq xmm2, xmm7, [rbx] vpaddq xmm2, xmm7, [rbx]{1to2} vpaddq xmm2, xmm7, [rbx+r11*8+256] vpaddq xmm2, xmm7, [rbx+r11*8-256] vpaddq xmm2{k5}, xmm7, xmm0 vpaddq xmm2{k5}, xmm7, [rbx] vpaddq xmm2{k5}, xmm7, [rbx]{1to2} vpaddq xmm2{k5}, xmm7, [rbx+r11*8+256] vpaddq xmm2{k5}, xmm7, [rbx+r11*8-256] vpaddq xmm2{k5}{z}, xmm7, xmm0 vpaddq xmm2{k5}{z}, xmm7, [rbx] vpaddq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpaddq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpaddq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpaddq ymm16, ymm13, ymm15 vpaddq ymm16, ymm13, [rbx] vpaddq ymm16, ymm13, [rbx]{1to4} vpaddq ymm16, ymm13, [rbx+r11*8+256] vpaddq ymm16, ymm13, [rbx+r11*8-256] vpaddq ymm16{k5}, ymm13, ymm15 vpaddq ymm16{k5}, ymm13, [rbx] vpaddq ymm16{k5}, ymm13, [rbx]{1to4} vpaddq ymm16{k5}, ymm13, [rbx+r11*8+256] vpaddq ymm16{k5}, ymm13, [rbx+r11*8-256] vpaddq ymm16{k5}{z}, ymm13, ymm15 vpaddq ymm16{k5}{z}, ymm13, [rbx] vpaddq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpaddq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpaddq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpaddq zmm24, zmm24, zmm31 vpaddq zmm24, zmm24, [rbx] vpaddq zmm24, zmm24, [rbx]{1to8} vpaddq zmm24, zmm24, [rbx+r11*8+256] vpaddq zmm24, zmm24, [rbx+r11*8-256] vpaddq zmm24{k5}, zmm24, zmm31 vpaddq zmm24{k5}, zmm24, [rbx] vpaddq zmm24{k5}, zmm24, [rbx]{1to8} vpaddq zmm24{k5}, zmm24, [rbx+r11*8+256] vpaddq zmm24{k5}, zmm24, [rbx+r11*8-256] vpaddq zmm24{k5}{z}, zmm24, zmm31 vpaddq zmm24{k5}{z}, zmm24, [rbx] vpaddq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpaddq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpaddq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpandd xmm2, xmm7, xmm0 vpandd xmm2, xmm7, [rbx] vpandd xmm2, xmm7, [rbx]{1to4} vpandd xmm2, xmm7, [rbx+r11*8+256] vpandd xmm2, xmm7, [rbx+r11*8-256] vpandd xmm2{k5}, xmm7, xmm0 vpandd xmm2{k5}, xmm7, [rbx] vpandd xmm2{k5}, xmm7, [rbx]{1to4} vpandd xmm2{k5}, xmm7, [rbx+r11*8+256] vpandd xmm2{k5}, xmm7, [rbx+r11*8-256] vpandd xmm2{k5}{z}, xmm7, xmm0 vpandd xmm2{k5}{z}, xmm7, [rbx] vpandd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpandd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpandd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpandd ymm16, ymm13, ymm15 vpandd ymm16, ymm13, [rbx] vpandd ymm16, ymm13, [rbx]{1to8} vpandd ymm16, ymm13, [rbx+r11*8+256] vpandd ymm16, ymm13, [rbx+r11*8-256] vpandd ymm16{k5}, ymm13, ymm15 vpandd ymm16{k5}, ymm13, [rbx] vpandd ymm16{k5}, ymm13, [rbx]{1to8} vpandd ymm16{k5}, ymm13, [rbx+r11*8+256] vpandd ymm16{k5}, ymm13, [rbx+r11*8-256] vpandd ymm16{k5}{z}, ymm13, ymm15 vpandd ymm16{k5}{z}, ymm13, [rbx] vpandd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpandd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpandd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpandd zmm24, zmm24, zmm31 vpandd zmm24, zmm24, [rbx] vpandd zmm24, zmm24, [rbx]{1to16} vpandd zmm24, zmm24, [rbx+r11*8+256] vpandd zmm24, zmm24, [rbx+r11*8-256] vpandd zmm24{k5}, zmm24, zmm31 vpandd zmm24{k5}, zmm24, [rbx] vpandd zmm24{k5}, zmm24, [rbx]{1to16} vpandd zmm24{k5}, zmm24, [rbx+r11*8+256] vpandd zmm24{k5}, zmm24, [rbx+r11*8-256] vpandd zmm24{k5}{z}, zmm24, zmm31 vpandd zmm24{k5}{z}, zmm24, [rbx] vpandd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpandd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpandd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpandnd xmm2, xmm7, xmm0 vpandnd xmm2, xmm7, [rbx] vpandnd xmm2, xmm7, [rbx]{1to4} vpandnd xmm2, xmm7, [rbx+r11*8+256] vpandnd xmm2, xmm7, [rbx+r11*8-256] vpandnd xmm2{k5}, xmm7, xmm0 vpandnd xmm2{k5}, xmm7, [rbx] vpandnd xmm2{k5}, xmm7, [rbx]{1to4} vpandnd xmm2{k5}, xmm7, [rbx+r11*8+256] vpandnd xmm2{k5}, xmm7, [rbx+r11*8-256] vpandnd xmm2{k5}{z}, xmm7, xmm0 vpandnd xmm2{k5}{z}, xmm7, [rbx] vpandnd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpandnd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpandnd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpandnd ymm16, ymm13, ymm15 vpandnd ymm16, ymm13, [rbx] vpandnd ymm16, ymm13, [rbx]{1to8} vpandnd ymm16, ymm13, [rbx+r11*8+256] vpandnd ymm16, ymm13, [rbx+r11*8-256] vpandnd ymm16{k5}, ymm13, ymm15 vpandnd ymm16{k5}, ymm13, [rbx] vpandnd ymm16{k5}, ymm13, [rbx]{1to8} vpandnd ymm16{k5}, ymm13, [rbx+r11*8+256] vpandnd ymm16{k5}, ymm13, [rbx+r11*8-256] vpandnd ymm16{k5}{z}, ymm13, ymm15 vpandnd ymm16{k5}{z}, ymm13, [rbx] vpandnd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpandnd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpandnd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpandnd zmm24, zmm24, zmm31 vpandnd zmm24, zmm24, [rbx] vpandnd zmm24, zmm24, [rbx]{1to16} vpandnd zmm24, zmm24, [rbx+r11*8+256] vpandnd zmm24, zmm24, [rbx+r11*8-256] vpandnd zmm24{k5}, zmm24, zmm31 vpandnd zmm24{k5}, zmm24, [rbx] vpandnd zmm24{k5}, zmm24, [rbx]{1to16} vpandnd zmm24{k5}, zmm24, [rbx+r11*8+256] vpandnd zmm24{k5}, zmm24, [rbx+r11*8-256] vpandnd zmm24{k5}{z}, zmm24, zmm31 vpandnd zmm24{k5}{z}, zmm24, [rbx] vpandnd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpandnd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpandnd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpandnq xmm2, xmm7, xmm0 vpandnq xmm2, xmm7, [rbx] vpandnq xmm2, xmm7, [rbx]{1to2} vpandnq xmm2, xmm7, [rbx+r11*8+256] vpandnq xmm2, xmm7, [rbx+r11*8-256] vpandnq xmm2{k5}, xmm7, xmm0 vpandnq xmm2{k5}, xmm7, [rbx] vpandnq xmm2{k5}, xmm7, [rbx]{1to2} vpandnq xmm2{k5}, xmm7, [rbx+r11*8+256] vpandnq xmm2{k5}, xmm7, [rbx+r11*8-256] vpandnq xmm2{k5}{z}, xmm7, xmm0 vpandnq xmm2{k5}{z}, xmm7, [rbx] vpandnq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpandnq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpandnq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpandnq ymm16, ymm13, ymm15 vpandnq ymm16, ymm13, [rbx] vpandnq ymm16, ymm13, [rbx]{1to4} vpandnq ymm16, ymm13, [rbx+r11*8+256] vpandnq ymm16, ymm13, [rbx+r11*8-256] vpandnq ymm16{k5}, ymm13, ymm15 vpandnq ymm16{k5}, ymm13, [rbx] vpandnq ymm16{k5}, ymm13, [rbx]{1to4} vpandnq ymm16{k5}, ymm13, [rbx+r11*8+256] vpandnq ymm16{k5}, ymm13, [rbx+r11*8-256] vpandnq ymm16{k5}{z}, ymm13, ymm15 vpandnq ymm16{k5}{z}, ymm13, [rbx] vpandnq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpandnq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpandnq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpandnq zmm24, zmm24, zmm31 vpandnq zmm24, zmm24, [rbx] vpandnq zmm24, zmm24, [rbx]{1to8} vpandnq zmm24, zmm24, [rbx+r11*8+256] vpandnq zmm24, zmm24, [rbx+r11*8-256] vpandnq zmm24{k5}, zmm24, zmm31 vpandnq zmm24{k5}, zmm24, [rbx] vpandnq zmm24{k5}, zmm24, [rbx]{1to8} vpandnq zmm24{k5}, zmm24, [rbx+r11*8+256] vpandnq zmm24{k5}, zmm24, [rbx+r11*8-256] vpandnq zmm24{k5}{z}, zmm24, zmm31 vpandnq zmm24{k5}{z}, zmm24, [rbx] vpandnq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpandnq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpandnq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpandq xmm2, xmm7, xmm0 vpandq xmm2, xmm7, [rbx] vpandq xmm2, xmm7, [rbx]{1to2} vpandq xmm2, xmm7, [rbx+r11*8+256] vpandq xmm2, xmm7, [rbx+r11*8-256] vpandq xmm2{k5}, xmm7, xmm0 vpandq xmm2{k5}, xmm7, [rbx] vpandq xmm2{k5}, xmm7, [rbx]{1to2} vpandq xmm2{k5}, xmm7, [rbx+r11*8+256] vpandq xmm2{k5}, xmm7, [rbx+r11*8-256] vpandq xmm2{k5}{z}, xmm7, xmm0 vpandq xmm2{k5}{z}, xmm7, [rbx] vpandq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpandq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpandq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpandq ymm16, ymm13, ymm15 vpandq ymm16, ymm13, [rbx] vpandq ymm16, ymm13, [rbx]{1to4} vpandq ymm16, ymm13, [rbx+r11*8+256] vpandq ymm16, ymm13, [rbx+r11*8-256] vpandq ymm16{k5}, ymm13, ymm15 vpandq ymm16{k5}, ymm13, [rbx] vpandq ymm16{k5}, ymm13, [rbx]{1to4} vpandq ymm16{k5}, ymm13, [rbx+r11*8+256] vpandq ymm16{k5}, ymm13, [rbx+r11*8-256] vpandq ymm16{k5}{z}, ymm13, ymm15 vpandq ymm16{k5}{z}, ymm13, [rbx] vpandq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpandq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpandq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpandq zmm24, zmm24, zmm31 vpandq zmm24, zmm24, [rbx] vpandq zmm24, zmm24, [rbx]{1to8} vpandq zmm24, zmm24, [rbx+r11*8+256] vpandq zmm24, zmm24, [rbx+r11*8-256] vpandq zmm24{k5}, zmm24, zmm31 vpandq zmm24{k5}, zmm24, [rbx] vpandq zmm24{k5}, zmm24, [rbx]{1to8} vpandq zmm24{k5}, zmm24, [rbx+r11*8+256] vpandq zmm24{k5}, zmm24, [rbx+r11*8-256] vpandq zmm24{k5}{z}, zmm24, zmm31 vpandq zmm24{k5}{z}, zmm24, [rbx] vpandq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpandq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpandq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpblendmd xmm2, xmm7, xmm0 vpblendmd xmm2, xmm7, [rbx] vpblendmd xmm2, xmm7, [rbx]{1to4} vpblendmd xmm2, xmm7, [rbx+r11*8+256] vpblendmd xmm2, xmm7, [rbx+r11*8-256] vpblendmd xmm2{k5}, xmm7, xmm0 vpblendmd xmm2{k5}, xmm7, [rbx] vpblendmd xmm2{k5}, xmm7, [rbx]{1to4} vpblendmd xmm2{k5}, xmm7, [rbx+r11*8+256] vpblendmd xmm2{k5}, xmm7, [rbx+r11*8-256] vpblendmd xmm2{k5}{z}, xmm7, xmm0 vpblendmd xmm2{k5}{z}, xmm7, [rbx] vpblendmd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpblendmd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpblendmd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpblendmd ymm16, ymm13, ymm15 vpblendmd ymm16, ymm13, [rbx] vpblendmd ymm16, ymm13, [rbx]{1to8} vpblendmd ymm16, ymm13, [rbx+r11*8+256] vpblendmd ymm16, ymm13, [rbx+r11*8-256] vpblendmd ymm16{k5}, ymm13, ymm15 vpblendmd ymm16{k5}, ymm13, [rbx] vpblendmd ymm16{k5}, ymm13, [rbx]{1to8} vpblendmd ymm16{k5}, ymm13, [rbx+r11*8+256] vpblendmd ymm16{k5}, ymm13, [rbx+r11*8-256] vpblendmd ymm16{k5}{z}, ymm13, ymm15 vpblendmd ymm16{k5}{z}, ymm13, [rbx] vpblendmd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpblendmd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpblendmd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpblendmd zmm24, zmm24, zmm31 vpblendmd zmm24, zmm24, [rbx] vpblendmd zmm24, zmm24, [rbx]{1to16} vpblendmd zmm24, zmm24, [rbx+r11*8+256] vpblendmd zmm24, zmm24, [rbx+r11*8-256] vpblendmd zmm24{k5}, zmm24, zmm31 vpblendmd zmm24{k5}, zmm24, [rbx] vpblendmd zmm24{k5}, zmm24, [rbx]{1to16} vpblendmd zmm24{k5}, zmm24, [rbx+r11*8+256] vpblendmd zmm24{k5}, zmm24, [rbx+r11*8-256] vpblendmd zmm24{k5}{z}, zmm24, zmm31 vpblendmd zmm24{k5}{z}, zmm24, [rbx] vpblendmd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpblendmd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpblendmd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpblendmq xmm2, xmm7, xmm0 vpblendmq xmm2, xmm7, [rbx] vpblendmq xmm2, xmm7, [rbx]{1to2} vpblendmq xmm2, xmm7, [rbx+r11*8+256] vpblendmq xmm2, xmm7, [rbx+r11*8-256] vpblendmq xmm2{k5}, xmm7, xmm0 vpblendmq xmm2{k5}, xmm7, [rbx] vpblendmq xmm2{k5}, xmm7, [rbx]{1to2} vpblendmq xmm2{k5}, xmm7, [rbx+r11*8+256] vpblendmq xmm2{k5}, xmm7, [rbx+r11*8-256] vpblendmq xmm2{k5}{z}, xmm7, xmm0 vpblendmq xmm2{k5}{z}, xmm7, [rbx] vpblendmq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpblendmq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpblendmq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpblendmq ymm16, ymm13, ymm15 vpblendmq ymm16, ymm13, [rbx] vpblendmq ymm16, ymm13, [rbx]{1to4} vpblendmq ymm16, ymm13, [rbx+r11*8+256] vpblendmq ymm16, ymm13, [rbx+r11*8-256] vpblendmq ymm16{k5}, ymm13, ymm15 vpblendmq ymm16{k5}, ymm13, [rbx] vpblendmq ymm16{k5}, ymm13, [rbx]{1to4} vpblendmq ymm16{k5}, ymm13, [rbx+r11*8+256] vpblendmq ymm16{k5}, ymm13, [rbx+r11*8-256] vpblendmq ymm16{k5}{z}, ymm13, ymm15 vpblendmq ymm16{k5}{z}, ymm13, [rbx] vpblendmq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpblendmq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpblendmq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpblendmq zmm24, zmm24, zmm31 vpblendmq zmm24, zmm24, [rbx] vpblendmq zmm24, zmm24, [rbx]{1to8} vpblendmq zmm24, zmm24, [rbx+r11*8+256] vpblendmq zmm24, zmm24, [rbx+r11*8-256] vpblendmq zmm24{k5}, zmm24, zmm31 vpblendmq zmm24{k5}, zmm24, [rbx] vpblendmq zmm24{k5}, zmm24, [rbx]{1to8} vpblendmq zmm24{k5}, zmm24, [rbx+r11*8+256] vpblendmq zmm24{k5}, zmm24, [rbx+r11*8-256] vpblendmq zmm24{k5}{z}, zmm24, zmm31 vpblendmq zmm24{k5}{z}, zmm24, [rbx] vpblendmq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpblendmq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpblendmq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpbroadcastd xmm2, xmm0 vpbroadcastd xmm2, [rbx] vpbroadcastd xmm2, [rbx+r11*8+256] vpbroadcastd xmm2, [rbx+r11*8-256] vpbroadcastd xmm2{k5}, xmm0 vpbroadcastd xmm2{k5}, [rbx] vpbroadcastd xmm2{k5}, [rbx+r11*8+256] vpbroadcastd xmm2{k5}, [rbx+r11*8-256] vpbroadcastd xmm2{k5}{z}, xmm0 vpbroadcastd xmm2{k5}{z}, [rbx] vpbroadcastd xmm2{k5}{z}, [rbx+r11*8+256] vpbroadcastd xmm2{k5}{z}, [rbx+r11*8-256] vpbroadcastd ymm16, xmm0 vpbroadcastd ymm16, [rbx] vpbroadcastd ymm16, [rbx+r11*8+256] vpbroadcastd ymm16, [rbx+r11*8-256] vpbroadcastd ymm16{k5}, xmm0 vpbroadcastd ymm16{k5}, [rbx] vpbroadcastd ymm16{k5}, [rbx+r11*8+256] vpbroadcastd ymm16{k5}, [rbx+r11*8-256] vpbroadcastd ymm16{k5}{z}, xmm0 vpbroadcastd ymm16{k5}{z}, [rbx] vpbroadcastd ymm16{k5}{z}, [rbx+r11*8+256] vpbroadcastd ymm16{k5}{z}, [rbx+r11*8-256] vpbroadcastd zmm24, xmm0 vpbroadcastd zmm24, [rbx] vpbroadcastd zmm24, [rbx+r11*8+256] vpbroadcastd zmm24, [rbx+r11*8-256] vpbroadcastd zmm24{k5}, xmm0 vpbroadcastd zmm24{k5}, [rbx] vpbroadcastd zmm24{k5}, [rbx+r11*8+256] vpbroadcastd zmm24{k5}, [rbx+r11*8-256] vpbroadcastd zmm24{k5}{z}, xmm0 vpbroadcastd zmm24{k5}{z}, [rbx] vpbroadcastd zmm24{k5}{z}, [rbx+r11*8+256] vpbroadcastd zmm24{k5}{z}, [rbx+r11*8-256] vpbroadcastd xmm2, ecx vpbroadcastd xmm2{k5}, ecx vpbroadcastd xmm2{k5}{z}, ecx vpbroadcastd ymm16, ecx vpbroadcastd ymm16{k5}, ecx vpbroadcastd ymm16{k5}{z}, ecx vpbroadcastd zmm24, ecx vpbroadcastd zmm24{k5}, ecx vpbroadcastd zmm24{k5}{z}, ecx vpbroadcastq xmm2, xmm0 vpbroadcastq xmm2, [rbx] vpbroadcastq xmm2, [rbx+r11*8+256] vpbroadcastq xmm2, [rbx+r11*8-256] vpbroadcastq xmm2{k5}, xmm0 vpbroadcastq xmm2{k5}, [rbx] vpbroadcastq xmm2{k5}, [rbx+r11*8+256] vpbroadcastq xmm2{k5}, [rbx+r11*8-256] vpbroadcastq xmm2{k5}{z}, xmm0 vpbroadcastq xmm2{k5}{z}, [rbx] vpbroadcastq xmm2{k5}{z}, [rbx+r11*8+256] vpbroadcastq xmm2{k5}{z}, [rbx+r11*8-256] vpbroadcastq ymm16, xmm0 vpbroadcastq ymm16, [rbx] vpbroadcastq ymm16, [rbx+r11*8+256] vpbroadcastq ymm16, [rbx+r11*8-256] vpbroadcastq ymm16{k5}, xmm0 vpbroadcastq ymm16{k5}, [rbx] vpbroadcastq ymm16{k5}, [rbx+r11*8+256] vpbroadcastq ymm16{k5}, [rbx+r11*8-256] vpbroadcastq ymm16{k5}{z}, xmm0 vpbroadcastq ymm16{k5}{z}, [rbx] vpbroadcastq ymm16{k5}{z}, [rbx+r11*8+256] vpbroadcastq ymm16{k5}{z}, [rbx+r11*8-256] vpbroadcastq zmm24, xmm0 vpbroadcastq zmm24, [rbx] vpbroadcastq zmm24, [rbx+r11*8+256] vpbroadcastq zmm24, [rbx+r11*8-256] vpbroadcastq zmm24{k5}, xmm0 vpbroadcastq zmm24{k5}, [rbx] vpbroadcastq zmm24{k5}, [rbx+r11*8+256] vpbroadcastq zmm24{k5}, [rbx+r11*8-256] vpbroadcastq zmm24{k5}{z}, xmm0 vpbroadcastq zmm24{k5}{z}, [rbx] vpbroadcastq zmm24{k5}{z}, [rbx+r11*8+256] vpbroadcastq zmm24{k5}{z}, [rbx+r11*8-256] vpbroadcastq xmm2, rcx vpbroadcastq xmm2{k5}, rcx vpbroadcastq xmm2{k5}{z}, rcx vpbroadcastq ymm16, rcx vpbroadcastq ymm16{k5}, rcx vpbroadcastq ymm16{k5}{z}, rcx vpbroadcastq zmm24, rcx vpbroadcastq zmm24{k5}, rcx vpbroadcastq zmm24{k5}{z}, rcx vpcmpd k3, xmm7, xmm0, 10 vpcmpd k3, xmm7, [rbx], 10 vpcmpd k3, xmm7, [rbx]{1to4}, 10 vpcmpd k3, xmm7, [rbx+r11*8+256], 10 vpcmpd k3, xmm7, [rbx+r11*8-256], 10 vpcmpd k3, ymm13, ymm15, 10 vpcmpd k3, ymm13, [rbx], 10 vpcmpd k3, ymm13, [rbx]{1to8}, 10 vpcmpd k3, ymm13, [rbx+r11*8+256], 10 vpcmpd k3, ymm13, [rbx+r11*8-256], 10 vpcmpd k3, zmm24, zmm31, 10 vpcmpd k3, zmm24, [rbx], 10 vpcmpd k3, zmm24, [rbx]{1to16}, 10 vpcmpd k3, zmm24, [rbx+r11*8+256], 10 vpcmpd k3, zmm24, [rbx+r11*8-256], 10 vpcmpd k3{k5}, xmm7, xmm0, 10 vpcmpd k3{k5}, xmm7, [rbx], 10 vpcmpd k3{k5}, xmm7, [rbx]{1to4}, 10 vpcmpd k3{k5}, xmm7, [rbx+r11*8+256], 10 vpcmpd k3{k5}, xmm7, [rbx+r11*8-256], 10 vpcmpd k3{k5}, ymm13, ymm15, 10 vpcmpd k3{k5}, ymm13, [rbx], 10 vpcmpd k3{k5}, ymm13, [rbx]{1to8}, 10 vpcmpd k3{k5}, ymm13, [rbx+r11*8+256], 10 vpcmpd k3{k5}, ymm13, [rbx+r11*8-256], 10 vpcmpd k3{k5}, zmm24, zmm31, 10 vpcmpd k3{k5}, zmm24, [rbx], 10 vpcmpd k3{k5}, zmm24, [rbx]{1to16}, 10 vpcmpd k3{k5}, zmm24, [rbx+r11*8+256], 10 vpcmpd k3{k5}, zmm24, [rbx+r11*8-256], 10 vpcmpeqd k3, xmm7, xmm0 vpcmpeqd k3, xmm7, [rbx] vpcmpeqd k3, xmm7, [rbx]{1to4} vpcmpeqd k3, xmm7, [rbx+r11*8+256] vpcmpeqd k3, xmm7, [rbx+r11*8-256] vpcmpeqd k3, ymm13, ymm15 vpcmpeqd k3, ymm13, [rbx] vpcmpeqd k3, ymm13, [rbx]{1to8} vpcmpeqd k3, ymm13, [rbx+r11*8+256] vpcmpeqd k3, ymm13, [rbx+r11*8-256] vpcmpeqd k3, zmm24, zmm31 vpcmpeqd k3, zmm24, [rbx] vpcmpeqd k3, zmm24, [rbx]{1to16} vpcmpeqd k3, zmm24, [rbx+r11*8+256] vpcmpeqd k3, zmm24, [rbx+r11*8-256] vpcmpeqd k3{k5}, xmm7, xmm0 vpcmpeqd k3{k5}, xmm7, [rbx] vpcmpeqd k3{k5}, xmm7, [rbx]{1to4} vpcmpeqd k3{k5}, xmm7, [rbx+r11*8+256] vpcmpeqd k3{k5}, xmm7, [rbx+r11*8-256] vpcmpeqd k3{k5}, ymm13, ymm15 vpcmpeqd k3{k5}, ymm13, [rbx] vpcmpeqd k3{k5}, ymm13, [rbx]{1to8} vpcmpeqd k3{k5}, ymm13, [rbx+r11*8+256] vpcmpeqd k3{k5}, ymm13, [rbx+r11*8-256] vpcmpeqd k3{k5}, zmm24, zmm31 vpcmpeqd k3{k5}, zmm24, [rbx] vpcmpeqd k3{k5}, zmm24, [rbx]{1to16} vpcmpeqd k3{k5}, zmm24, [rbx+r11*8+256] vpcmpeqd k3{k5}, zmm24, [rbx+r11*8-256] vpcmpeqq k3, xmm7, xmm0 vpcmpeqq k3, xmm7, [rbx] vpcmpeqq k3, xmm7, [rbx]{1to2} vpcmpeqq k3, xmm7, [rbx+r11*8+256] vpcmpeqq k3, xmm7, [rbx+r11*8-256] vpcmpeqq k3, ymm13, ymm15 vpcmpeqq k3, ymm13, [rbx] vpcmpeqq k3, ymm13, [rbx]{1to4} vpcmpeqq k3, ymm13, [rbx+r11*8+256] vpcmpeqq k3, ymm13, [rbx+r11*8-256] vpcmpeqq k3, zmm24, zmm31 vpcmpeqq k3, zmm24, [rbx] vpcmpeqq k3, zmm24, [rbx]{1to8} vpcmpeqq k3, zmm24, [rbx+r11*8+256] vpcmpeqq k3, zmm24, [rbx+r11*8-256] vpcmpeqq k3{k5}, xmm7, xmm0 vpcmpeqq k3{k5}, xmm7, [rbx] vpcmpeqq k3{k5}, xmm7, [rbx]{1to2} vpcmpeqq k3{k5}, xmm7, [rbx+r11*8+256] vpcmpeqq k3{k5}, xmm7, [rbx+r11*8-256] vpcmpeqq k3{k5}, ymm13, ymm15 vpcmpeqq k3{k5}, ymm13, [rbx] vpcmpeqq k3{k5}, ymm13, [rbx]{1to4} vpcmpeqq k3{k5}, ymm13, [rbx+r11*8+256] vpcmpeqq k3{k5}, ymm13, [rbx+r11*8-256] vpcmpeqq k3{k5}, zmm24, zmm31 vpcmpeqq k3{k5}, zmm24, [rbx] vpcmpeqq k3{k5}, zmm24, [rbx]{1to8} vpcmpeqq k3{k5}, zmm24, [rbx+r11*8+256] vpcmpeqq k3{k5}, zmm24, [rbx+r11*8-256] vpcmpgtd k3, xmm7, xmm0 vpcmpgtd k3, xmm7, [rbx] vpcmpgtd k3, xmm7, [rbx]{1to4} vpcmpgtd k3, xmm7, [rbx+r11*8+256] vpcmpgtd k3, xmm7, [rbx+r11*8-256] vpcmpgtd k3, ymm13, ymm15 vpcmpgtd k3, ymm13, [rbx] vpcmpgtd k3, ymm13, [rbx]{1to8} vpcmpgtd k3, ymm13, [rbx+r11*8+256] vpcmpgtd k3, ymm13, [rbx+r11*8-256] vpcmpgtd k3, zmm24, zmm31 vpcmpgtd k3, zmm24, [rbx] vpcmpgtd k3, zmm24, [rbx]{1to16} vpcmpgtd k3, zmm24, [rbx+r11*8+256] vpcmpgtd k3, zmm24, [rbx+r11*8-256] vpcmpgtd k3{k5}, xmm7, xmm0 vpcmpgtd k3{k5}, xmm7, [rbx] vpcmpgtd k3{k5}, xmm7, [rbx]{1to4} vpcmpgtd k3{k5}, xmm7, [rbx+r11*8+256] vpcmpgtd k3{k5}, xmm7, [rbx+r11*8-256] vpcmpgtd k3{k5}, ymm13, ymm15 vpcmpgtd k3{k5}, ymm13, [rbx] vpcmpgtd k3{k5}, ymm13, [rbx]{1to8} vpcmpgtd k3{k5}, ymm13, [rbx+r11*8+256] vpcmpgtd k3{k5}, ymm13, [rbx+r11*8-256] vpcmpgtd k3{k5}, zmm24, zmm31 vpcmpgtd k3{k5}, zmm24, [rbx] vpcmpgtd k3{k5}, zmm24, [rbx]{1to16} vpcmpgtd k3{k5}, zmm24, [rbx+r11*8+256] vpcmpgtd k3{k5}, zmm24, [rbx+r11*8-256] vpcmpgtq k3, xmm7, xmm0 vpcmpgtq k3, xmm7, [rbx] vpcmpgtq k3, xmm7, [rbx]{1to2} vpcmpgtq k3, xmm7, [rbx+r11*8+256] vpcmpgtq k3, xmm7, [rbx+r11*8-256] vpcmpgtq k3, ymm13, ymm15 vpcmpgtq k3, ymm13, [rbx] vpcmpgtq k3, ymm13, [rbx]{1to4} vpcmpgtq k3, ymm13, [rbx+r11*8+256] vpcmpgtq k3, ymm13, [rbx+r11*8-256] vpcmpgtq k3, zmm24, zmm31 vpcmpgtq k3, zmm24, [rbx] vpcmpgtq k3, zmm24, [rbx]{1to8} vpcmpgtq k3, zmm24, [rbx+r11*8+256] vpcmpgtq k3, zmm24, [rbx+r11*8-256] vpcmpgtq k3{k5}, xmm7, xmm0 vpcmpgtq k3{k5}, xmm7, [rbx] vpcmpgtq k3{k5}, xmm7, [rbx]{1to2} vpcmpgtq k3{k5}, xmm7, [rbx+r11*8+256] vpcmpgtq k3{k5}, xmm7, [rbx+r11*8-256] vpcmpgtq k3{k5}, ymm13, ymm15 vpcmpgtq k3{k5}, ymm13, [rbx] vpcmpgtq k3{k5}, ymm13, [rbx]{1to4} vpcmpgtq k3{k5}, ymm13, [rbx+r11*8+256] vpcmpgtq k3{k5}, ymm13, [rbx+r11*8-256] vpcmpgtq k3{k5}, zmm24, zmm31 vpcmpgtq k3{k5}, zmm24, [rbx] vpcmpgtq k3{k5}, zmm24, [rbx]{1to8} vpcmpgtq k3{k5}, zmm24, [rbx+r11*8+256] vpcmpgtq k3{k5}, zmm24, [rbx+r11*8-256] vpcmpq k3, xmm7, xmm0, 10 vpcmpq k3, xmm7, [rbx], 10 vpcmpq k3, xmm7, [rbx]{1to2}, 10 vpcmpq k3, xmm7, [rbx+r11*8+256], 10 vpcmpq k3, xmm7, [rbx+r11*8-256], 10 vpcmpq k3, ymm13, ymm15, 10 vpcmpq k3, ymm13, [rbx], 10 vpcmpq k3, ymm13, [rbx]{1to4}, 10 vpcmpq k3, ymm13, [rbx+r11*8+256], 10 vpcmpq k3, ymm13, [rbx+r11*8-256], 10 vpcmpq k3, zmm24, zmm31, 10 vpcmpq k3, zmm24, [rbx], 10 vpcmpq k3, zmm24, [rbx]{1to8}, 10 vpcmpq k3, zmm24, [rbx+r11*8+256], 10 vpcmpq k3, zmm24, [rbx+r11*8-256], 10 vpcmpq k3{k5}, xmm7, xmm0, 10 vpcmpq k3{k5}, xmm7, [rbx], 10 vpcmpq k3{k5}, xmm7, [rbx]{1to2}, 10 vpcmpq k3{k5}, xmm7, [rbx+r11*8+256], 10 vpcmpq k3{k5}, xmm7, [rbx+r11*8-256], 10 vpcmpq k3{k5}, ymm13, ymm15, 10 vpcmpq k3{k5}, ymm13, [rbx], 10 vpcmpq k3{k5}, ymm13, [rbx]{1to4}, 10 vpcmpq k3{k5}, ymm13, [rbx+r11*8+256], 10 vpcmpq k3{k5}, ymm13, [rbx+r11*8-256], 10 vpcmpq k3{k5}, zmm24, zmm31, 10 vpcmpq k3{k5}, zmm24, [rbx], 10 vpcmpq k3{k5}, zmm24, [rbx]{1to8}, 10 vpcmpq k3{k5}, zmm24, [rbx+r11*8+256], 10 vpcmpq k3{k5}, zmm24, [rbx+r11*8-256], 10 vpcmpud k3, xmm7, xmm0, 10 vpcmpud k3, xmm7, [rbx], 10 vpcmpud k3, xmm7, [rbx]{1to4}, 10 vpcmpud k3, xmm7, [rbx+r11*8+256], 10 vpcmpud k3, xmm7, [rbx+r11*8-256], 10 vpcmpud k3, ymm13, ymm15, 10 vpcmpud k3, ymm13, [rbx], 10 vpcmpud k3, ymm13, [rbx]{1to8}, 10 vpcmpud k3, ymm13, [rbx+r11*8+256], 10 vpcmpud k3, ymm13, [rbx+r11*8-256], 10 vpcmpud k3, zmm24, zmm31, 10 vpcmpud k3, zmm24, [rbx], 10 vpcmpud k3, zmm24, [rbx]{1to16}, 10 vpcmpud k3, zmm24, [rbx+r11*8+256], 10 vpcmpud k3, zmm24, [rbx+r11*8-256], 10 vpcmpud k3{k5}, xmm7, xmm0, 10 vpcmpud k3{k5}, xmm7, [rbx], 10 vpcmpud k3{k5}, xmm7, [rbx]{1to4}, 10 vpcmpud k3{k5}, xmm7, [rbx+r11*8+256], 10 vpcmpud k3{k5}, xmm7, [rbx+r11*8-256], 10 vpcmpud k3{k5}, ymm13, ymm15, 10 vpcmpud k3{k5}, ymm13, [rbx], 10 vpcmpud k3{k5}, ymm13, [rbx]{1to8}, 10 vpcmpud k3{k5}, ymm13, [rbx+r11*8+256], 10 vpcmpud k3{k5}, ymm13, [rbx+r11*8-256], 10 vpcmpud k3{k5}, zmm24, zmm31, 10 vpcmpud k3{k5}, zmm24, [rbx], 10 vpcmpud k3{k5}, zmm24, [rbx]{1to16}, 10 vpcmpud k3{k5}, zmm24, [rbx+r11*8+256], 10 vpcmpud k3{k5}, zmm24, [rbx+r11*8-256], 10 vpcmpuq k3, xmm7, xmm0, 10 vpcmpuq k3, xmm7, [rbx], 10 vpcmpuq k3, xmm7, [rbx]{1to2}, 10 vpcmpuq k3, xmm7, [rbx+r11*8+256], 10 vpcmpuq k3, xmm7, [rbx+r11*8-256], 10 vpcmpuq k3, ymm13, ymm15, 10 vpcmpuq k3, ymm13, [rbx], 10 vpcmpuq k3, ymm13, [rbx]{1to4}, 10 vpcmpuq k3, ymm13, [rbx+r11*8+256], 10 vpcmpuq k3, ymm13, [rbx+r11*8-256], 10 vpcmpuq k3, zmm24, zmm31, 10 vpcmpuq k3, zmm24, [rbx], 10 vpcmpuq k3, zmm24, [rbx]{1to8}, 10 vpcmpuq k3, zmm24, [rbx+r11*8+256], 10 vpcmpuq k3, zmm24, [rbx+r11*8-256], 10 vpcmpuq k3{k5}, xmm7, xmm0, 10 vpcmpuq k3{k5}, xmm7, [rbx], 10 vpcmpuq k3{k5}, xmm7, [rbx]{1to2}, 10 vpcmpuq k3{k5}, xmm7, [rbx+r11*8+256], 10 vpcmpuq k3{k5}, xmm7, [rbx+r11*8-256], 10 vpcmpuq k3{k5}, ymm13, ymm15, 10 vpcmpuq k3{k5}, ymm13, [rbx], 10 vpcmpuq k3{k5}, ymm13, [rbx]{1to4}, 10 vpcmpuq k3{k5}, ymm13, [rbx+r11*8+256], 10 vpcmpuq k3{k5}, ymm13, [rbx+r11*8-256], 10 vpcmpuq k3{k5}, zmm24, zmm31, 10 vpcmpuq k3{k5}, zmm24, [rbx], 10 vpcmpuq k3{k5}, zmm24, [rbx]{1to8}, 10 vpcmpuq k3{k5}, zmm24, [rbx+r11*8+256], 10 vpcmpuq k3{k5}, zmm24, [rbx+r11*8-256], 10 vpcompressd xmm0, xmm2 vpcompressd ymm15, ymm16 vpcompressd zmm31, zmm24 vpcompressd [rbx], xmm2 vpcompressd [rbx], ymm16 vpcompressd [rbx], zmm24 vpcompressd [rbx+r11*8+256], xmm2 vpcompressd [rbx+r11*8+256], ymm16 vpcompressd [rbx+r11*8+256], zmm24 vpcompressd [rbx+r11*8-256], xmm2 vpcompressd [rbx+r11*8-256], ymm16 vpcompressd [rbx+r11*8-256], zmm24 vpcompressq xmm0, xmm2 vpcompressq ymm15, ymm16 vpcompressq zmm31, zmm24 vpcompressq [rbx], xmm2 vpcompressq [rbx], ymm16 vpcompressq [rbx], zmm24 vpcompressq [rbx+r11*8+256], xmm2 vpcompressq [rbx+r11*8+256], ymm16 vpcompressq [rbx+r11*8+256], zmm24 vpcompressq [rbx+r11*8-256], xmm2 vpcompressq [rbx+r11*8-256], ymm16 vpcompressq [rbx+r11*8-256], zmm24 vpermd ymm16, ymm13, ymm15 vpermd ymm16, ymm13, [rbx] vpermd ymm16, ymm13, [rbx]{1to8} vpermd ymm16, ymm13, [rbx+r11*8+256] vpermd ymm16, ymm13, [rbx+r11*8-256] vpermd ymm16{k5}, ymm13, ymm15 vpermd ymm16{k5}, ymm13, [rbx] vpermd ymm16{k5}, ymm13, [rbx]{1to8} vpermd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermd ymm16{k5}{z}, ymm13, ymm15 vpermd ymm16{k5}{z}, ymm13, [rbx] vpermd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermd zmm24, zmm24, zmm31 vpermd zmm24, zmm24, [rbx] vpermd zmm24, zmm24, [rbx]{1to16} vpermd zmm24, zmm24, [rbx+r11*8+256] vpermd zmm24, zmm24, [rbx+r11*8-256] vpermd zmm24{k5}, zmm24, zmm31 vpermd zmm24{k5}, zmm24, [rbx] vpermd zmm24{k5}, zmm24, [rbx]{1to16} vpermd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermd zmm24{k5}{z}, zmm24, zmm31 vpermd zmm24{k5}{z}, zmm24, [rbx] vpermd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermi2d xmm2, xmm7, xmm0 vpermi2d xmm2, xmm7, [rbx] vpermi2d xmm2, xmm7, [rbx]{1to4} vpermi2d xmm2, xmm7, [rbx+r11*8+256] vpermi2d xmm2, xmm7, [rbx+r11*8-256] vpermi2d xmm2{k5}, xmm7, xmm0 vpermi2d xmm2{k5}, xmm7, [rbx] vpermi2d xmm2{k5}, xmm7, [rbx]{1to4} vpermi2d xmm2{k5}, xmm7, [rbx+r11*8+256] vpermi2d xmm2{k5}, xmm7, [rbx+r11*8-256] vpermi2d xmm2{k5}{z}, xmm7, xmm0 vpermi2d xmm2{k5}{z}, xmm7, [rbx] vpermi2d xmm2{k5}{z}, xmm7, [rbx]{1to4} vpermi2d xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermi2d xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermi2d ymm16, ymm13, ymm15 vpermi2d ymm16, ymm13, [rbx] vpermi2d ymm16, ymm13, [rbx]{1to8} vpermi2d ymm16, ymm13, [rbx+r11*8+256] vpermi2d ymm16, ymm13, [rbx+r11*8-256] vpermi2d ymm16{k5}, ymm13, ymm15 vpermi2d ymm16{k5}, ymm13, [rbx] vpermi2d ymm16{k5}, ymm13, [rbx]{1to8} vpermi2d ymm16{k5}, ymm13, [rbx+r11*8+256] vpermi2d ymm16{k5}, ymm13, [rbx+r11*8-256] vpermi2d ymm16{k5}{z}, ymm13, ymm15 vpermi2d ymm16{k5}{z}, ymm13, [rbx] vpermi2d ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermi2d ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermi2d ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermi2d zmm24, zmm24, zmm31 vpermi2d zmm24, zmm24, [rbx] vpermi2d zmm24, zmm24, [rbx]{1to16} vpermi2d zmm24, zmm24, [rbx+r11*8+256] vpermi2d zmm24, zmm24, [rbx+r11*8-256] vpermi2d zmm24{k5}, zmm24, zmm31 vpermi2d zmm24{k5}, zmm24, [rbx] vpermi2d zmm24{k5}, zmm24, [rbx]{1to16} vpermi2d zmm24{k5}, zmm24, [rbx+r11*8+256] vpermi2d zmm24{k5}, zmm24, [rbx+r11*8-256] vpermi2d zmm24{k5}{z}, zmm24, zmm31 vpermi2d zmm24{k5}{z}, zmm24, [rbx] vpermi2d zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermi2d zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermi2d zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermi2pd xmm2, xmm7, xmm0 vpermi2pd xmm2, xmm7, [rbx] vpermi2pd xmm2, xmm7, [rbx]{1to2} vpermi2pd xmm2, xmm7, [rbx+r11*8+256] vpermi2pd xmm2, xmm7, [rbx+r11*8-256] vpermi2pd xmm2{k5}, xmm7, xmm0 vpermi2pd xmm2{k5}, xmm7, [rbx] vpermi2pd xmm2{k5}, xmm7, [rbx]{1to2} vpermi2pd xmm2{k5}, xmm7, [rbx+r11*8+256] vpermi2pd xmm2{k5}, xmm7, [rbx+r11*8-256] vpermi2pd xmm2{k5}{z}, xmm7, xmm0 vpermi2pd xmm2{k5}{z}, xmm7, [rbx] vpermi2pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vpermi2pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermi2pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermi2pd ymm16, ymm13, ymm15 vpermi2pd ymm16, ymm13, [rbx] vpermi2pd ymm16, ymm13, [rbx]{1to4} vpermi2pd ymm16, ymm13, [rbx+r11*8+256] vpermi2pd ymm16, ymm13, [rbx+r11*8-256] vpermi2pd ymm16{k5}, ymm13, ymm15 vpermi2pd ymm16{k5}, ymm13, [rbx] vpermi2pd ymm16{k5}, ymm13, [rbx]{1to4} vpermi2pd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermi2pd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermi2pd ymm16{k5}{z}, ymm13, ymm15 vpermi2pd ymm16{k5}{z}, ymm13, [rbx] vpermi2pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermi2pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermi2pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermi2pd zmm24, zmm24, zmm31 vpermi2pd zmm24, zmm24, [rbx] vpermi2pd zmm24, zmm24, [rbx]{1to8} vpermi2pd zmm24, zmm24, [rbx+r11*8+256] vpermi2pd zmm24, zmm24, [rbx+r11*8-256] vpermi2pd zmm24{k5}, zmm24, zmm31 vpermi2pd zmm24{k5}, zmm24, [rbx] vpermi2pd zmm24{k5}, zmm24, [rbx]{1to8} vpermi2pd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermi2pd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermi2pd zmm24{k5}{z}, zmm24, zmm31 vpermi2pd zmm24{k5}{z}, zmm24, [rbx] vpermi2pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermi2pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermi2pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermi2ps xmm2, xmm7, xmm0 vpermi2ps xmm2, xmm7, [rbx] vpermi2ps xmm2, xmm7, [rbx]{1to4} vpermi2ps xmm2, xmm7, [rbx+r11*8+256] vpermi2ps xmm2, xmm7, [rbx+r11*8-256] vpermi2ps xmm2{k5}, xmm7, xmm0 vpermi2ps xmm2{k5}, xmm7, [rbx] vpermi2ps xmm2{k5}, xmm7, [rbx]{1to4} vpermi2ps xmm2{k5}, xmm7, [rbx+r11*8+256] vpermi2ps xmm2{k5}, xmm7, [rbx+r11*8-256] vpermi2ps xmm2{k5}{z}, xmm7, xmm0 vpermi2ps xmm2{k5}{z}, xmm7, [rbx] vpermi2ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vpermi2ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermi2ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermi2ps ymm16, ymm13, ymm15 vpermi2ps ymm16, ymm13, [rbx] vpermi2ps ymm16, ymm13, [rbx]{1to8} vpermi2ps ymm16, ymm13, [rbx+r11*8+256] vpermi2ps ymm16, ymm13, [rbx+r11*8-256] vpermi2ps ymm16{k5}, ymm13, ymm15 vpermi2ps ymm16{k5}, ymm13, [rbx] vpermi2ps ymm16{k5}, ymm13, [rbx]{1to8} vpermi2ps ymm16{k5}, ymm13, [rbx+r11*8+256] vpermi2ps ymm16{k5}, ymm13, [rbx+r11*8-256] vpermi2ps ymm16{k5}{z}, ymm13, ymm15 vpermi2ps ymm16{k5}{z}, ymm13, [rbx] vpermi2ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermi2ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermi2ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermi2ps zmm24, zmm24, zmm31 vpermi2ps zmm24, zmm24, [rbx] vpermi2ps zmm24, zmm24, [rbx]{1to16} vpermi2ps zmm24, zmm24, [rbx+r11*8+256] vpermi2ps zmm24, zmm24, [rbx+r11*8-256] vpermi2ps zmm24{k5}, zmm24, zmm31 vpermi2ps zmm24{k5}, zmm24, [rbx] vpermi2ps zmm24{k5}, zmm24, [rbx]{1to16} vpermi2ps zmm24{k5}, zmm24, [rbx+r11*8+256] vpermi2ps zmm24{k5}, zmm24, [rbx+r11*8-256] vpermi2ps zmm24{k5}{z}, zmm24, zmm31 vpermi2ps zmm24{k5}{z}, zmm24, [rbx] vpermi2ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermi2ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermi2ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermi2q xmm2, xmm7, xmm0 vpermi2q xmm2, xmm7, [rbx] vpermi2q xmm2, xmm7, [rbx]{1to2} vpermi2q xmm2, xmm7, [rbx+r11*8+256] vpermi2q xmm2, xmm7, [rbx+r11*8-256] vpermi2q xmm2{k5}, xmm7, xmm0 vpermi2q xmm2{k5}, xmm7, [rbx] vpermi2q xmm2{k5}, xmm7, [rbx]{1to2} vpermi2q xmm2{k5}, xmm7, [rbx+r11*8+256] vpermi2q xmm2{k5}, xmm7, [rbx+r11*8-256] vpermi2q xmm2{k5}{z}, xmm7, xmm0 vpermi2q xmm2{k5}{z}, xmm7, [rbx] vpermi2q xmm2{k5}{z}, xmm7, [rbx]{1to2} vpermi2q xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermi2q xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermi2q ymm16, ymm13, ymm15 vpermi2q ymm16, ymm13, [rbx] vpermi2q ymm16, ymm13, [rbx]{1to4} vpermi2q ymm16, ymm13, [rbx+r11*8+256] vpermi2q ymm16, ymm13, [rbx+r11*8-256] vpermi2q ymm16{k5}, ymm13, ymm15 vpermi2q ymm16{k5}, ymm13, [rbx] vpermi2q ymm16{k5}, ymm13, [rbx]{1to4} vpermi2q ymm16{k5}, ymm13, [rbx+r11*8+256] vpermi2q ymm16{k5}, ymm13, [rbx+r11*8-256] vpermi2q ymm16{k5}{z}, ymm13, ymm15 vpermi2q ymm16{k5}{z}, ymm13, [rbx] vpermi2q ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermi2q ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermi2q ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermi2q zmm24, zmm24, zmm31 vpermi2q zmm24, zmm24, [rbx] vpermi2q zmm24, zmm24, [rbx]{1to8} vpermi2q zmm24, zmm24, [rbx+r11*8+256] vpermi2q zmm24, zmm24, [rbx+r11*8-256] vpermi2q zmm24{k5}, zmm24, zmm31 vpermi2q zmm24{k5}, zmm24, [rbx] vpermi2q zmm24{k5}, zmm24, [rbx]{1to8} vpermi2q zmm24{k5}, zmm24, [rbx+r11*8+256] vpermi2q zmm24{k5}, zmm24, [rbx+r11*8-256] vpermi2q zmm24{k5}{z}, zmm24, zmm31 vpermi2q zmm24{k5}{z}, zmm24, [rbx] vpermi2q zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermi2q zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermi2q zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermilpd xmm2, xmm7, xmm0 vpermilpd xmm2, xmm7, [rbx] vpermilpd xmm2, xmm7, [rbx]{1to2} vpermilpd xmm2, xmm7, [rbx+r11*8+256] vpermilpd xmm2, xmm7, [rbx+r11*8-256] vpermilpd xmm2{k5}, xmm7, xmm0 vpermilpd xmm2{k5}, xmm7, [rbx] vpermilpd xmm2{k5}, xmm7, [rbx]{1to2} vpermilpd xmm2{k5}, xmm7, [rbx+r11*8+256] vpermilpd xmm2{k5}, xmm7, [rbx+r11*8-256] vpermilpd xmm2{k5}{z}, xmm7, xmm0 vpermilpd xmm2{k5}{z}, xmm7, [rbx] vpermilpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vpermilpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermilpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermilpd ymm16, ymm13, ymm15 vpermilpd ymm16, ymm13, [rbx] vpermilpd ymm16, ymm13, [rbx]{1to4} vpermilpd ymm16, ymm13, [rbx+r11*8+256] vpermilpd ymm16, ymm13, [rbx+r11*8-256] vpermilpd ymm16{k5}, ymm13, ymm15 vpermilpd ymm16{k5}, ymm13, [rbx] vpermilpd ymm16{k5}, ymm13, [rbx]{1to4} vpermilpd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermilpd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermilpd ymm16{k5}{z}, ymm13, ymm15 vpermilpd ymm16{k5}{z}, ymm13, [rbx] vpermilpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermilpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermilpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermilpd zmm24, zmm24, zmm31 vpermilpd zmm24, zmm24, [rbx] vpermilpd zmm24, zmm24, [rbx]{1to8} vpermilpd zmm24, zmm24, [rbx+r11*8+256] vpermilpd zmm24, zmm24, [rbx+r11*8-256] vpermilpd zmm24{k5}, zmm24, zmm31 vpermilpd zmm24{k5}, zmm24, [rbx] vpermilpd zmm24{k5}, zmm24, [rbx]{1to8} vpermilpd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermilpd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermilpd zmm24{k5}{z}, zmm24, zmm31 vpermilpd zmm24{k5}{z}, zmm24, [rbx] vpermilpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermilpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermilpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermilpd xmm2, xmm0, 10 vpermilpd xmm2, [rbx], 10 vpermilpd xmm2, [rbx]{1to2}, 10 vpermilpd xmm2, [rbx+r11*8+256], 10 vpermilpd xmm2, [rbx+r11*8-256], 10 vpermilpd xmm2{k5}, xmm0, 10 vpermilpd xmm2{k5}, [rbx], 10 vpermilpd xmm2{k5}, [rbx]{1to2}, 10 vpermilpd xmm2{k5}, [rbx+r11*8+256], 10 vpermilpd xmm2{k5}, [rbx+r11*8-256], 10 vpermilpd xmm2{k5}{z}, xmm0, 10 vpermilpd xmm2{k5}{z}, [rbx], 10 vpermilpd xmm2{k5}{z}, [rbx]{1to2}, 10 vpermilpd xmm2{k5}{z}, [rbx+r11*8+256], 10 vpermilpd xmm2{k5}{z}, [rbx+r11*8-256], 10 vpermilpd ymm16, ymm15, 10 vpermilpd ymm16, [rbx], 10 vpermilpd ymm16, [rbx]{1to4}, 10 vpermilpd ymm16, [rbx+r11*8+256], 10 vpermilpd ymm16, [rbx+r11*8-256], 10 vpermilpd ymm16{k5}, ymm15, 10 vpermilpd ymm16{k5}, [rbx], 10 vpermilpd ymm16{k5}, [rbx]{1to4}, 10 vpermilpd ymm16{k5}, [rbx+r11*8+256], 10 vpermilpd ymm16{k5}, [rbx+r11*8-256], 10 vpermilpd ymm16{k5}{z}, ymm15, 10 vpermilpd ymm16{k5}{z}, [rbx], 10 vpermilpd ymm16{k5}{z}, [rbx]{1to4}, 10 vpermilpd ymm16{k5}{z}, [rbx+r11*8+256], 10 vpermilpd ymm16{k5}{z}, [rbx+r11*8-256], 10 vpermilpd zmm24, zmm31, 10 vpermilpd zmm24, [rbx], 10 vpermilpd zmm24, [rbx]{1to8}, 10 vpermilpd zmm24, [rbx+r11*8+256], 10 vpermilpd zmm24, [rbx+r11*8-256], 10 vpermilpd zmm24{k5}, zmm31, 10 vpermilpd zmm24{k5}, [rbx], 10 vpermilpd zmm24{k5}, [rbx]{1to8}, 10 vpermilpd zmm24{k5}, [rbx+r11*8+256], 10 vpermilpd zmm24{k5}, [rbx+r11*8-256], 10 vpermilpd zmm24{k5}{z}, zmm31, 10 vpermilpd zmm24{k5}{z}, [rbx], 10 vpermilpd zmm24{k5}{z}, [rbx]{1to8}, 10 vpermilpd zmm24{k5}{z}, [rbx+r11*8+256], 10 vpermilpd zmm24{k5}{z}, [rbx+r11*8-256], 10 vpermilps xmm2, xmm7, xmm0 vpermilps xmm2, xmm7, [rbx] vpermilps xmm2, xmm7, [rbx]{1to4} vpermilps xmm2, xmm7, [rbx+r11*8+256] vpermilps xmm2, xmm7, [rbx+r11*8-256] vpermilps xmm2{k5}, xmm7, xmm0 vpermilps xmm2{k5}, xmm7, [rbx] vpermilps xmm2{k5}, xmm7, [rbx]{1to4} vpermilps xmm2{k5}, xmm7, [rbx+r11*8+256] vpermilps xmm2{k5}, xmm7, [rbx+r11*8-256] vpermilps xmm2{k5}{z}, xmm7, xmm0 vpermilps xmm2{k5}{z}, xmm7, [rbx] vpermilps xmm2{k5}{z}, xmm7, [rbx]{1to4} vpermilps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermilps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermilps ymm16, ymm13, ymm15 vpermilps ymm16, ymm13, [rbx] vpermilps ymm16, ymm13, [rbx]{1to8} vpermilps ymm16, ymm13, [rbx+r11*8+256] vpermilps ymm16, ymm13, [rbx+r11*8-256] vpermilps ymm16{k5}, ymm13, ymm15 vpermilps ymm16{k5}, ymm13, [rbx] vpermilps ymm16{k5}, ymm13, [rbx]{1to8} vpermilps ymm16{k5}, ymm13, [rbx+r11*8+256] vpermilps ymm16{k5}, ymm13, [rbx+r11*8-256] vpermilps ymm16{k5}{z}, ymm13, ymm15 vpermilps ymm16{k5}{z}, ymm13, [rbx] vpermilps ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermilps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermilps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermilps zmm24, zmm24, zmm31 vpermilps zmm24, zmm24, [rbx] vpermilps zmm24, zmm24, [rbx]{1to16} vpermilps zmm24, zmm24, [rbx+r11*8+256] vpermilps zmm24, zmm24, [rbx+r11*8-256] vpermilps zmm24{k5}, zmm24, zmm31 vpermilps zmm24{k5}, zmm24, [rbx] vpermilps zmm24{k5}, zmm24, [rbx]{1to16} vpermilps zmm24{k5}, zmm24, [rbx+r11*8+256] vpermilps zmm24{k5}, zmm24, [rbx+r11*8-256] vpermilps zmm24{k5}{z}, zmm24, zmm31 vpermilps zmm24{k5}{z}, zmm24, [rbx] vpermilps zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermilps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermilps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermilps xmm2, xmm0, 10 vpermilps xmm2, [rbx], 10 vpermilps xmm2, [rbx]{1to4}, 10 vpermilps xmm2, [rbx+r11*8+256], 10 vpermilps xmm2, [rbx+r11*8-256], 10 vpermilps xmm2{k5}, xmm0, 10 vpermilps xmm2{k5}, [rbx], 10 vpermilps xmm2{k5}, [rbx]{1to4}, 10 vpermilps xmm2{k5}, [rbx+r11*8+256], 10 vpermilps xmm2{k5}, [rbx+r11*8-256], 10 vpermilps xmm2{k5}{z}, xmm0, 10 vpermilps xmm2{k5}{z}, [rbx], 10 vpermilps xmm2{k5}{z}, [rbx]{1to4}, 10 vpermilps xmm2{k5}{z}, [rbx+r11*8+256], 10 vpermilps xmm2{k5}{z}, [rbx+r11*8-256], 10 vpermilps ymm16, ymm15, 10 vpermilps ymm16, [rbx], 10 vpermilps ymm16, [rbx]{1to8}, 10 vpermilps ymm16, [rbx+r11*8+256], 10 vpermilps ymm16, [rbx+r11*8-256], 10 vpermilps ymm16{k5}, ymm15, 10 vpermilps ymm16{k5}, [rbx], 10 vpermilps ymm16{k5}, [rbx]{1to8}, 10 vpermilps ymm16{k5}, [rbx+r11*8+256], 10 vpermilps ymm16{k5}, [rbx+r11*8-256], 10 vpermilps ymm16{k5}{z}, ymm15, 10 vpermilps ymm16{k5}{z}, [rbx], 10 vpermilps ymm16{k5}{z}, [rbx]{1to8}, 10 vpermilps ymm16{k5}{z}, [rbx+r11*8+256], 10 vpermilps ymm16{k5}{z}, [rbx+r11*8-256], 10 vpermilps zmm24, zmm31, 10 vpermilps zmm24, [rbx], 10 vpermilps zmm24, [rbx]{1to16}, 10 vpermilps zmm24, [rbx+r11*8+256], 10 vpermilps zmm24, [rbx+r11*8-256], 10 vpermilps zmm24{k5}, zmm31, 10 vpermilps zmm24{k5}, [rbx], 10 vpermilps zmm24{k5}, [rbx]{1to16}, 10 vpermilps zmm24{k5}, [rbx+r11*8+256], 10 vpermilps zmm24{k5}, [rbx+r11*8-256], 10 vpermilps zmm24{k5}{z}, zmm31, 10 vpermilps zmm24{k5}{z}, [rbx], 10 vpermilps zmm24{k5}{z}, [rbx]{1to16}, 10 vpermilps zmm24{k5}{z}, [rbx+r11*8+256], 10 vpermilps zmm24{k5}{z}, [rbx+r11*8-256], 10 vpermpd ymm16, ymm13, ymm15 vpermpd ymm16, ymm13, [rbx] vpermpd ymm16, ymm13, [rbx]{1to4} vpermpd ymm16, ymm13, [rbx+r11*8+256] vpermpd ymm16, ymm13, [rbx+r11*8-256] vpermpd ymm16{k5}, ymm13, ymm15 vpermpd ymm16{k5}, ymm13, [rbx] vpermpd ymm16{k5}, ymm13, [rbx]{1to4} vpermpd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermpd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermpd ymm16{k5}{z}, ymm13, ymm15 vpermpd ymm16{k5}{z}, ymm13, [rbx] vpermpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermpd zmm24, zmm24, zmm31 vpermpd zmm24, zmm24, [rbx] vpermpd zmm24, zmm24, [rbx]{1to8} vpermpd zmm24, zmm24, [rbx+r11*8+256] vpermpd zmm24, zmm24, [rbx+r11*8-256] vpermpd zmm24{k5}, zmm24, zmm31 vpermpd zmm24{k5}, zmm24, [rbx] vpermpd zmm24{k5}, zmm24, [rbx]{1to8} vpermpd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermpd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermpd zmm24{k5}{z}, zmm24, zmm31 vpermpd zmm24{k5}{z}, zmm24, [rbx] vpermpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermpd ymm16, ymm13, ymm15 vpermpd ymm16, ymm13, [rbx] vpermpd ymm16, ymm13, [rbx]{1to4} vpermpd ymm16, ymm13, [rbx+r11*8+256] vpermpd ymm16, ymm13, [rbx+r11*8-256] vpermpd ymm16{k5}, ymm13, ymm15 vpermpd ymm16{k5}, ymm13, [rbx] vpermpd ymm16{k5}, ymm13, [rbx]{1to4} vpermpd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermpd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermpd ymm16{k5}{z}, ymm13, ymm15 vpermpd ymm16{k5}{z}, ymm13, [rbx] vpermpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermpd zmm24, zmm24, zmm31 vpermpd zmm24, zmm24, [rbx] vpermpd zmm24, zmm24, [rbx]{1to8} vpermpd zmm24, zmm24, [rbx+r11*8+256] vpermpd zmm24, zmm24, [rbx+r11*8-256] vpermpd zmm24{k5}, zmm24, zmm31 vpermpd zmm24{k5}, zmm24, [rbx] vpermpd zmm24{k5}, zmm24, [rbx]{1to8} vpermpd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermpd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermpd zmm24{k5}{z}, zmm24, zmm31 vpermpd zmm24{k5}{z}, zmm24, [rbx] vpermpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermpd ymm16, ymm15, 10 vpermpd ymm16, [rbx], 10 vpermpd ymm16, [rbx]{1to4}, 10 vpermpd ymm16, [rbx+r11*8+256], 10 vpermpd ymm16, [rbx+r11*8-256], 10 vpermpd ymm16{k5}, ymm15, 10 vpermpd ymm16{k5}, [rbx], 10 vpermpd ymm16{k5}, [rbx]{1to4}, 10 vpermpd ymm16{k5}, [rbx+r11*8+256], 10 vpermpd ymm16{k5}, [rbx+r11*8-256], 10 vpermpd ymm16{k5}{z}, ymm15, 10 vpermpd ymm16{k5}{z}, [rbx], 10 vpermpd ymm16{k5}{z}, [rbx]{1to4}, 10 vpermpd ymm16{k5}{z}, [rbx+r11*8+256], 10 vpermpd ymm16{k5}{z}, [rbx+r11*8-256], 10 vpermpd zmm24, zmm31, 10 vpermpd zmm24, [rbx], 10 vpermpd zmm24, [rbx]{1to8}, 10 vpermpd zmm24, [rbx+r11*8+256], 10 vpermpd zmm24, [rbx+r11*8-256], 10 vpermpd zmm24{k5}, zmm31, 10 vpermpd zmm24{k5}, [rbx], 10 vpermpd zmm24{k5}, [rbx]{1to8}, 10 vpermpd zmm24{k5}, [rbx+r11*8+256], 10 vpermpd zmm24{k5}, [rbx+r11*8-256], 10 vpermpd zmm24{k5}{z}, zmm31, 10 vpermpd zmm24{k5}{z}, [rbx], 10 vpermpd zmm24{k5}{z}, [rbx]{1to8}, 10 vpermpd zmm24{k5}{z}, [rbx+r11*8+256], 10 vpermpd zmm24{k5}{z}, [rbx+r11*8-256], 10 vpermps ymm16, ymm13, ymm15 vpermps ymm16, ymm13, [rbx] vpermps ymm16, ymm13, [rbx]{1to8} vpermps ymm16, ymm13, [rbx+r11*8+256] vpermps ymm16, ymm13, [rbx+r11*8-256] vpermps ymm16{k5}, ymm13, ymm15 vpermps ymm16{k5}, ymm13, [rbx] vpermps ymm16{k5}, ymm13, [rbx]{1to8} vpermps ymm16{k5}, ymm13, [rbx+r11*8+256] vpermps ymm16{k5}, ymm13, [rbx+r11*8-256] vpermps ymm16{k5}{z}, ymm13, ymm15 vpermps ymm16{k5}{z}, ymm13, [rbx] vpermps ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermps zmm24, zmm24, zmm31 vpermps zmm24, zmm24, [rbx] vpermps zmm24, zmm24, [rbx]{1to16} vpermps zmm24, zmm24, [rbx+r11*8+256] vpermps zmm24, zmm24, [rbx+r11*8-256] vpermps zmm24{k5}, zmm24, zmm31 vpermps zmm24{k5}, zmm24, [rbx] vpermps zmm24{k5}, zmm24, [rbx]{1to16} vpermps zmm24{k5}, zmm24, [rbx+r11*8+256] vpermps zmm24{k5}, zmm24, [rbx+r11*8-256] vpermps zmm24{k5}{z}, zmm24, zmm31 vpermps zmm24{k5}{z}, zmm24, [rbx] vpermps zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermps ymm16, ymm13, ymm15 vpermps ymm16, ymm13, [rbx] vpermps ymm16, ymm13, [rbx]{1to8} vpermps ymm16, ymm13, [rbx+r11*8+256] vpermps ymm16, ymm13, [rbx+r11*8-256] vpermps ymm16{k5}, ymm13, ymm15 vpermps ymm16{k5}, ymm13, [rbx] vpermps ymm16{k5}, ymm13, [rbx]{1to8} vpermps ymm16{k5}, ymm13, [rbx+r11*8+256] vpermps ymm16{k5}, ymm13, [rbx+r11*8-256] vpermps ymm16{k5}{z}, ymm13, ymm15 vpermps ymm16{k5}{z}, ymm13, [rbx] vpermps ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermps zmm24, zmm24, zmm31 vpermps zmm24, zmm24, [rbx] vpermps zmm24, zmm24, [rbx]{1to16} vpermps zmm24, zmm24, [rbx+r11*8+256] vpermps zmm24, zmm24, [rbx+r11*8-256] vpermps zmm24{k5}, zmm24, zmm31 vpermps zmm24{k5}, zmm24, [rbx] vpermps zmm24{k5}, zmm24, [rbx]{1to16} vpermps zmm24{k5}, zmm24, [rbx+r11*8+256] vpermps zmm24{k5}, zmm24, [rbx+r11*8-256] vpermps zmm24{k5}{z}, zmm24, zmm31 vpermps zmm24{k5}{z}, zmm24, [rbx] vpermps zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermq ymm16, ymm13, ymm15 vpermq ymm16, ymm13, [rbx] vpermq ymm16, ymm13, [rbx]{1to4} vpermq ymm16, ymm13, [rbx+r11*8+256] vpermq ymm16, ymm13, [rbx+r11*8-256] vpermq ymm16{k5}, ymm13, ymm15 vpermq ymm16{k5}, ymm13, [rbx] vpermq ymm16{k5}, ymm13, [rbx]{1to4} vpermq ymm16{k5}, ymm13, [rbx+r11*8+256] vpermq ymm16{k5}, ymm13, [rbx+r11*8-256] vpermq ymm16{k5}{z}, ymm13, ymm15 vpermq ymm16{k5}{z}, ymm13, [rbx] vpermq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermq zmm24, zmm24, zmm31 vpermq zmm24, zmm24, [rbx] vpermq zmm24, zmm24, [rbx]{1to8} vpermq zmm24, zmm24, [rbx+r11*8+256] vpermq zmm24, zmm24, [rbx+r11*8-256] vpermq zmm24{k5}, zmm24, zmm31 vpermq zmm24{k5}, zmm24, [rbx] vpermq zmm24{k5}, zmm24, [rbx]{1to8} vpermq zmm24{k5}, zmm24, [rbx+r11*8+256] vpermq zmm24{k5}, zmm24, [rbx+r11*8-256] vpermq zmm24{k5}{z}, zmm24, zmm31 vpermq zmm24{k5}{z}, zmm24, [rbx] vpermq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermq ymm16, ymm15, 10 vpermq ymm16, [rbx], 10 vpermq ymm16, [rbx]{1to4}, 10 vpermq ymm16, [rbx+r11*8+256], 10 vpermq ymm16, [rbx+r11*8-256], 10 vpermq ymm16{k5}, ymm15, 10 vpermq ymm16{k5}, [rbx], 10 vpermq ymm16{k5}, [rbx]{1to4}, 10 vpermq ymm16{k5}, [rbx+r11*8+256], 10 vpermq ymm16{k5}, [rbx+r11*8-256], 10 vpermq ymm16{k5}{z}, ymm15, 10 vpermq ymm16{k5}{z}, [rbx], 10 vpermq ymm16{k5}{z}, [rbx]{1to4}, 10 vpermq ymm16{k5}{z}, [rbx+r11*8+256], 10 vpermq ymm16{k5}{z}, [rbx+r11*8-256], 10 vpermq zmm24, zmm31, 10 vpermq zmm24, [rbx], 10 vpermq zmm24, [rbx]{1to8}, 10 vpermq zmm24, [rbx+r11*8+256], 10 vpermq zmm24, [rbx+r11*8-256], 10 vpermq zmm24{k5}, zmm31, 10 vpermq zmm24{k5}, [rbx], 10 vpermq zmm24{k5}, [rbx]{1to8}, 10 vpermq zmm24{k5}, [rbx+r11*8+256], 10 vpermq zmm24{k5}, [rbx+r11*8-256], 10 vpermq zmm24{k5}{z}, zmm31, 10 vpermq zmm24{k5}{z}, [rbx], 10 vpermq zmm24{k5}{z}, [rbx]{1to8}, 10 vpermq zmm24{k5}{z}, [rbx+r11*8+256], 10 vpermq zmm24{k5}{z}, [rbx+r11*8-256], 10 vpermt2d xmm2, xmm7, xmm0 vpermt2d xmm2, xmm7, [rbx] vpermt2d xmm2, xmm7, [rbx]{1to4} vpermt2d xmm2, xmm7, [rbx+r11*8+256] vpermt2d xmm2, xmm7, [rbx+r11*8-256] vpermt2d xmm2{k5}, xmm7, xmm0 vpermt2d xmm2{k5}, xmm7, [rbx] vpermt2d xmm2{k5}, xmm7, [rbx]{1to4} vpermt2d xmm2{k5}, xmm7, [rbx+r11*8+256] vpermt2d xmm2{k5}, xmm7, [rbx+r11*8-256] vpermt2d xmm2{k5}{z}, xmm7, xmm0 vpermt2d xmm2{k5}{z}, xmm7, [rbx] vpermt2d xmm2{k5}{z}, xmm7, [rbx]{1to4} vpermt2d xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermt2d xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermt2d ymm16, ymm13, ymm15 vpermt2d ymm16, ymm13, [rbx] vpermt2d ymm16, ymm13, [rbx]{1to8} vpermt2d ymm16, ymm13, [rbx+r11*8+256] vpermt2d ymm16, ymm13, [rbx+r11*8-256] vpermt2d ymm16{k5}, ymm13, ymm15 vpermt2d ymm16{k5}, ymm13, [rbx] vpermt2d ymm16{k5}, ymm13, [rbx]{1to8} vpermt2d ymm16{k5}, ymm13, [rbx+r11*8+256] vpermt2d ymm16{k5}, ymm13, [rbx+r11*8-256] vpermt2d ymm16{k5}{z}, ymm13, ymm15 vpermt2d ymm16{k5}{z}, ymm13, [rbx] vpermt2d ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermt2d ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermt2d ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermt2d zmm24, zmm24, zmm31 vpermt2d zmm24, zmm24, [rbx] vpermt2d zmm24, zmm24, [rbx]{1to16} vpermt2d zmm24, zmm24, [rbx+r11*8+256] vpermt2d zmm24, zmm24, [rbx+r11*8-256] vpermt2d zmm24{k5}, zmm24, zmm31 vpermt2d zmm24{k5}, zmm24, [rbx] vpermt2d zmm24{k5}, zmm24, [rbx]{1to16} vpermt2d zmm24{k5}, zmm24, [rbx+r11*8+256] vpermt2d zmm24{k5}, zmm24, [rbx+r11*8-256] vpermt2d zmm24{k5}{z}, zmm24, zmm31 vpermt2d zmm24{k5}{z}, zmm24, [rbx] vpermt2d zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermt2d zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermt2d zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermt2pd xmm2, xmm7, xmm0 vpermt2pd xmm2, xmm7, [rbx] vpermt2pd xmm2, xmm7, [rbx]{1to2} vpermt2pd xmm2, xmm7, [rbx+r11*8+256] vpermt2pd xmm2, xmm7, [rbx+r11*8-256] vpermt2pd xmm2{k5}, xmm7, xmm0 vpermt2pd xmm2{k5}, xmm7, [rbx] vpermt2pd xmm2{k5}, xmm7, [rbx]{1to2} vpermt2pd xmm2{k5}, xmm7, [rbx+r11*8+256] vpermt2pd xmm2{k5}, xmm7, [rbx+r11*8-256] vpermt2pd xmm2{k5}{z}, xmm7, xmm0 vpermt2pd xmm2{k5}{z}, xmm7, [rbx] vpermt2pd xmm2{k5}{z}, xmm7, [rbx]{1to2} vpermt2pd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermt2pd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermt2pd ymm16, ymm13, ymm15 vpermt2pd ymm16, ymm13, [rbx] vpermt2pd ymm16, ymm13, [rbx]{1to4} vpermt2pd ymm16, ymm13, [rbx+r11*8+256] vpermt2pd ymm16, ymm13, [rbx+r11*8-256] vpermt2pd ymm16{k5}, ymm13, ymm15 vpermt2pd ymm16{k5}, ymm13, [rbx] vpermt2pd ymm16{k5}, ymm13, [rbx]{1to4} vpermt2pd ymm16{k5}, ymm13, [rbx+r11*8+256] vpermt2pd ymm16{k5}, ymm13, [rbx+r11*8-256] vpermt2pd ymm16{k5}{z}, ymm13, ymm15 vpermt2pd ymm16{k5}{z}, ymm13, [rbx] vpermt2pd ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermt2pd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermt2pd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermt2pd zmm24, zmm24, zmm31 vpermt2pd zmm24, zmm24, [rbx] vpermt2pd zmm24, zmm24, [rbx]{1to8} vpermt2pd zmm24, zmm24, [rbx+r11*8+256] vpermt2pd zmm24, zmm24, [rbx+r11*8-256] vpermt2pd zmm24{k5}, zmm24, zmm31 vpermt2pd zmm24{k5}, zmm24, [rbx] vpermt2pd zmm24{k5}, zmm24, [rbx]{1to8} vpermt2pd zmm24{k5}, zmm24, [rbx+r11*8+256] vpermt2pd zmm24{k5}, zmm24, [rbx+r11*8-256] vpermt2pd zmm24{k5}{z}, zmm24, zmm31 vpermt2pd zmm24{k5}{z}, zmm24, [rbx] vpermt2pd zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermt2pd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermt2pd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermt2ps xmm2, xmm7, xmm0 vpermt2ps xmm2, xmm7, [rbx] vpermt2ps xmm2, xmm7, [rbx]{1to4} vpermt2ps xmm2, xmm7, [rbx+r11*8+256] vpermt2ps xmm2, xmm7, [rbx+r11*8-256] vpermt2ps xmm2{k5}, xmm7, xmm0 vpermt2ps xmm2{k5}, xmm7, [rbx] vpermt2ps xmm2{k5}, xmm7, [rbx]{1to4} vpermt2ps xmm2{k5}, xmm7, [rbx+r11*8+256] vpermt2ps xmm2{k5}, xmm7, [rbx+r11*8-256] vpermt2ps xmm2{k5}{z}, xmm7, xmm0 vpermt2ps xmm2{k5}{z}, xmm7, [rbx] vpermt2ps xmm2{k5}{z}, xmm7, [rbx]{1to4} vpermt2ps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermt2ps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermt2ps ymm16, ymm13, ymm15 vpermt2ps ymm16, ymm13, [rbx] vpermt2ps ymm16, ymm13, [rbx]{1to8} vpermt2ps ymm16, ymm13, [rbx+r11*8+256] vpermt2ps ymm16, ymm13, [rbx+r11*8-256] vpermt2ps ymm16{k5}, ymm13, ymm15 vpermt2ps ymm16{k5}, ymm13, [rbx] vpermt2ps ymm16{k5}, ymm13, [rbx]{1to8} vpermt2ps ymm16{k5}, ymm13, [rbx+r11*8+256] vpermt2ps ymm16{k5}, ymm13, [rbx+r11*8-256] vpermt2ps ymm16{k5}{z}, ymm13, ymm15 vpermt2ps ymm16{k5}{z}, ymm13, [rbx] vpermt2ps ymm16{k5}{z}, ymm13, [rbx]{1to8} vpermt2ps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermt2ps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermt2ps zmm24, zmm24, zmm31 vpermt2ps zmm24, zmm24, [rbx] vpermt2ps zmm24, zmm24, [rbx]{1to16} vpermt2ps zmm24, zmm24, [rbx+r11*8+256] vpermt2ps zmm24, zmm24, [rbx+r11*8-256] vpermt2ps zmm24{k5}, zmm24, zmm31 vpermt2ps zmm24{k5}, zmm24, [rbx] vpermt2ps zmm24{k5}, zmm24, [rbx]{1to16} vpermt2ps zmm24{k5}, zmm24, [rbx+r11*8+256] vpermt2ps zmm24{k5}, zmm24, [rbx+r11*8-256] vpermt2ps zmm24{k5}{z}, zmm24, zmm31 vpermt2ps zmm24{k5}{z}, zmm24, [rbx] vpermt2ps zmm24{k5}{z}, zmm24, [rbx]{1to16} vpermt2ps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermt2ps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpermt2q xmm2, xmm7, xmm0 vpermt2q xmm2, xmm7, [rbx] vpermt2q xmm2, xmm7, [rbx]{1to2} vpermt2q xmm2, xmm7, [rbx+r11*8+256] vpermt2q xmm2, xmm7, [rbx+r11*8-256] vpermt2q xmm2{k5}, xmm7, xmm0 vpermt2q xmm2{k5}, xmm7, [rbx] vpermt2q xmm2{k5}, xmm7, [rbx]{1to2} vpermt2q xmm2{k5}, xmm7, [rbx+r11*8+256] vpermt2q xmm2{k5}, xmm7, [rbx+r11*8-256] vpermt2q xmm2{k5}{z}, xmm7, xmm0 vpermt2q xmm2{k5}{z}, xmm7, [rbx] vpermt2q xmm2{k5}{z}, xmm7, [rbx]{1to2} vpermt2q xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpermt2q xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpermt2q ymm16, ymm13, ymm15 vpermt2q ymm16, ymm13, [rbx] vpermt2q ymm16, ymm13, [rbx]{1to4} vpermt2q ymm16, ymm13, [rbx+r11*8+256] vpermt2q ymm16, ymm13, [rbx+r11*8-256] vpermt2q ymm16{k5}, ymm13, ymm15 vpermt2q ymm16{k5}, ymm13, [rbx] vpermt2q ymm16{k5}, ymm13, [rbx]{1to4} vpermt2q ymm16{k5}, ymm13, [rbx+r11*8+256] vpermt2q ymm16{k5}, ymm13, [rbx+r11*8-256] vpermt2q ymm16{k5}{z}, ymm13, ymm15 vpermt2q ymm16{k5}{z}, ymm13, [rbx] vpermt2q ymm16{k5}{z}, ymm13, [rbx]{1to4} vpermt2q ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpermt2q ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpermt2q zmm24, zmm24, zmm31 vpermt2q zmm24, zmm24, [rbx] vpermt2q zmm24, zmm24, [rbx]{1to8} vpermt2q zmm24, zmm24, [rbx+r11*8+256] vpermt2q zmm24, zmm24, [rbx+r11*8-256] vpermt2q zmm24{k5}, zmm24, zmm31 vpermt2q zmm24{k5}, zmm24, [rbx] vpermt2q zmm24{k5}, zmm24, [rbx]{1to8} vpermt2q zmm24{k5}, zmm24, [rbx+r11*8+256] vpermt2q zmm24{k5}, zmm24, [rbx+r11*8-256] vpermt2q zmm24{k5}{z}, zmm24, zmm31 vpermt2q zmm24{k5}{z}, zmm24, [rbx] vpermt2q zmm24{k5}{z}, zmm24, [rbx]{1to8} vpermt2q zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpermt2q zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpexpandd xmm2, xmm0 vpexpandd xmm2, [rbx] vpexpandd xmm2, [rbx+r11*8+256] vpexpandd xmm2, [rbx+r11*8-256] vpexpandd xmm2{k5}, xmm0 vpexpandd xmm2{k5}, [rbx] vpexpandd xmm2{k5}, [rbx+r11*8+256] vpexpandd xmm2{k5}, [rbx+r11*8-256] vpexpandd xmm2{k5}{z}, xmm0 vpexpandd xmm2{k5}{z}, [rbx] vpexpandd xmm2{k5}{z}, [rbx+r11*8+256] vpexpandd xmm2{k5}{z}, [rbx+r11*8-256] vpexpandd ymm16, ymm15 vpexpandd ymm16, [rbx] vpexpandd ymm16, [rbx+r11*8+256] vpexpandd ymm16, [rbx+r11*8-256] vpexpandd ymm16{k5}, ymm15 vpexpandd ymm16{k5}, [rbx] vpexpandd ymm16{k5}, [rbx+r11*8+256] vpexpandd ymm16{k5}, [rbx+r11*8-256] vpexpandd ymm16{k5}{z}, ymm15 vpexpandd ymm16{k5}{z}, [rbx] vpexpandd ymm16{k5}{z}, [rbx+r11*8+256] vpexpandd ymm16{k5}{z}, [rbx+r11*8-256] vpexpandd zmm24, zmm31 vpexpandd zmm24, [rbx] vpexpandd zmm24, [rbx+r11*8+256] vpexpandd zmm24, [rbx+r11*8-256] vpexpandd zmm24{k5}, zmm31 vpexpandd zmm24{k5}, [rbx] vpexpandd zmm24{k5}, [rbx+r11*8+256] vpexpandd zmm24{k5}, [rbx+r11*8-256] vpexpandd zmm24{k5}{z}, zmm31 vpexpandd zmm24{k5}{z}, [rbx] vpexpandd zmm24{k5}{z}, [rbx+r11*8+256] vpexpandd zmm24{k5}{z}, [rbx+r11*8-256] vpexpandq xmm2, xmm0 vpexpandq xmm2, [rbx] vpexpandq xmm2, [rbx+r11*8+256] vpexpandq xmm2, [rbx+r11*8-256] vpexpandq xmm2{k5}, xmm0 vpexpandq xmm2{k5}, [rbx] vpexpandq xmm2{k5}, [rbx+r11*8+256] vpexpandq xmm2{k5}, [rbx+r11*8-256] vpexpandq xmm2{k5}{z}, xmm0 vpexpandq xmm2{k5}{z}, [rbx] vpexpandq xmm2{k5}{z}, [rbx+r11*8+256] vpexpandq xmm2{k5}{z}, [rbx+r11*8-256] vpexpandq ymm16, ymm15 vpexpandq ymm16, [rbx] vpexpandq ymm16, [rbx+r11*8+256] vpexpandq ymm16, [rbx+r11*8-256] vpexpandq ymm16{k5}, ymm15 vpexpandq ymm16{k5}, [rbx] vpexpandq ymm16{k5}, [rbx+r11*8+256] vpexpandq ymm16{k5}, [rbx+r11*8-256] vpexpandq ymm16{k5}{z}, ymm15 vpexpandq ymm16{k5}{z}, [rbx] vpexpandq ymm16{k5}{z}, [rbx+r11*8+256] vpexpandq ymm16{k5}{z}, [rbx+r11*8-256] vpexpandq zmm24, zmm31 vpexpandq zmm24, [rbx] vpexpandq zmm24, [rbx+r11*8+256] vpexpandq zmm24, [rbx+r11*8-256] vpexpandq zmm24{k5}, zmm31 vpexpandq zmm24{k5}, [rbx] vpexpandq zmm24{k5}, [rbx+r11*8+256] vpexpandq zmm24{k5}, [rbx+r11*8-256] vpexpandq zmm24{k5}{z}, zmm31 vpexpandq zmm24{k5}{z}, [rbx] vpexpandq zmm24{k5}{z}, [rbx+r11*8+256] vpexpandq zmm24{k5}{z}, [rbx+r11*8-256] vpmaxsd xmm2, xmm7, xmm0 vpmaxsd xmm2, xmm7, [rbx] vpmaxsd xmm2, xmm7, [rbx]{1to4} vpmaxsd xmm2, xmm7, [rbx+r11*8+256] vpmaxsd xmm2, xmm7, [rbx+r11*8-256] vpmaxsd xmm2{k5}, xmm7, xmm0 vpmaxsd xmm2{k5}, xmm7, [rbx] vpmaxsd xmm2{k5}, xmm7, [rbx]{1to4} vpmaxsd xmm2{k5}, xmm7, [rbx+r11*8+256] vpmaxsd xmm2{k5}, xmm7, [rbx+r11*8-256] vpmaxsd xmm2{k5}{z}, xmm7, xmm0 vpmaxsd xmm2{k5}{z}, xmm7, [rbx] vpmaxsd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpmaxsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmaxsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmaxsd ymm16, ymm13, ymm15 vpmaxsd ymm16, ymm13, [rbx] vpmaxsd ymm16, ymm13, [rbx]{1to8} vpmaxsd ymm16, ymm13, [rbx+r11*8+256] vpmaxsd ymm16, ymm13, [rbx+r11*8-256] vpmaxsd ymm16{k5}, ymm13, ymm15 vpmaxsd ymm16{k5}, ymm13, [rbx] vpmaxsd ymm16{k5}, ymm13, [rbx]{1to8} vpmaxsd ymm16{k5}, ymm13, [rbx+r11*8+256] vpmaxsd ymm16{k5}, ymm13, [rbx+r11*8-256] vpmaxsd ymm16{k5}{z}, ymm13, ymm15 vpmaxsd ymm16{k5}{z}, ymm13, [rbx] vpmaxsd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpmaxsd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmaxsd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmaxsd zmm24, zmm24, zmm31 vpmaxsd zmm24, zmm24, [rbx] vpmaxsd zmm24, zmm24, [rbx]{1to16} vpmaxsd zmm24, zmm24, [rbx+r11*8+256] vpmaxsd zmm24, zmm24, [rbx+r11*8-256] vpmaxsd zmm24{k5}, zmm24, zmm31 vpmaxsd zmm24{k5}, zmm24, [rbx] vpmaxsd zmm24{k5}, zmm24, [rbx]{1to16} vpmaxsd zmm24{k5}, zmm24, [rbx+r11*8+256] vpmaxsd zmm24{k5}, zmm24, [rbx+r11*8-256] vpmaxsd zmm24{k5}{z}, zmm24, zmm31 vpmaxsd zmm24{k5}{z}, zmm24, [rbx] vpmaxsd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpmaxsd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmaxsd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmaxsq xmm2, xmm7, xmm0 vpmaxsq xmm2, xmm7, [rbx] vpmaxsq xmm2, xmm7, [rbx]{1to2} vpmaxsq xmm2, xmm7, [rbx+r11*8+256] vpmaxsq xmm2, xmm7, [rbx+r11*8-256] vpmaxsq xmm2{k5}, xmm7, xmm0 vpmaxsq xmm2{k5}, xmm7, [rbx] vpmaxsq xmm2{k5}, xmm7, [rbx]{1to2} vpmaxsq xmm2{k5}, xmm7, [rbx+r11*8+256] vpmaxsq xmm2{k5}, xmm7, [rbx+r11*8-256] vpmaxsq xmm2{k5}{z}, xmm7, xmm0 vpmaxsq xmm2{k5}{z}, xmm7, [rbx] vpmaxsq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpmaxsq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmaxsq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmaxsq ymm16, ymm13, ymm15 vpmaxsq ymm16, ymm13, [rbx] vpmaxsq ymm16, ymm13, [rbx]{1to4} vpmaxsq ymm16, ymm13, [rbx+r11*8+256] vpmaxsq ymm16, ymm13, [rbx+r11*8-256] vpmaxsq ymm16{k5}, ymm13, ymm15 vpmaxsq ymm16{k5}, ymm13, [rbx] vpmaxsq ymm16{k5}, ymm13, [rbx]{1to4} vpmaxsq ymm16{k5}, ymm13, [rbx+r11*8+256] vpmaxsq ymm16{k5}, ymm13, [rbx+r11*8-256] vpmaxsq ymm16{k5}{z}, ymm13, ymm15 vpmaxsq ymm16{k5}{z}, ymm13, [rbx] vpmaxsq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpmaxsq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmaxsq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmaxsq zmm24, zmm24, zmm31 vpmaxsq zmm24, zmm24, [rbx] vpmaxsq zmm24, zmm24, [rbx]{1to8} vpmaxsq zmm24, zmm24, [rbx+r11*8+256] vpmaxsq zmm24, zmm24, [rbx+r11*8-256] vpmaxsq zmm24{k5}, zmm24, zmm31 vpmaxsq zmm24{k5}, zmm24, [rbx] vpmaxsq zmm24{k5}, zmm24, [rbx]{1to8} vpmaxsq zmm24{k5}, zmm24, [rbx+r11*8+256] vpmaxsq zmm24{k5}, zmm24, [rbx+r11*8-256] vpmaxsq zmm24{k5}{z}, zmm24, zmm31 vpmaxsq zmm24{k5}{z}, zmm24, [rbx] vpmaxsq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpmaxsq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmaxsq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmaxud xmm2, xmm7, xmm0 vpmaxud xmm2, xmm7, [rbx] vpmaxud xmm2, xmm7, [rbx]{1to4} vpmaxud xmm2, xmm7, [rbx+r11*8+256] vpmaxud xmm2, xmm7, [rbx+r11*8-256] vpmaxud xmm2{k5}, xmm7, xmm0 vpmaxud xmm2{k5}, xmm7, [rbx] vpmaxud xmm2{k5}, xmm7, [rbx]{1to4} vpmaxud xmm2{k5}, xmm7, [rbx+r11*8+256] vpmaxud xmm2{k5}, xmm7, [rbx+r11*8-256] vpmaxud xmm2{k5}{z}, xmm7, xmm0 vpmaxud xmm2{k5}{z}, xmm7, [rbx] vpmaxud xmm2{k5}{z}, xmm7, [rbx]{1to4} vpmaxud xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmaxud xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmaxud ymm16, ymm13, ymm15 vpmaxud ymm16, ymm13, [rbx] vpmaxud ymm16, ymm13, [rbx]{1to8} vpmaxud ymm16, ymm13, [rbx+r11*8+256] vpmaxud ymm16, ymm13, [rbx+r11*8-256] vpmaxud ymm16{k5}, ymm13, ymm15 vpmaxud ymm16{k5}, ymm13, [rbx] vpmaxud ymm16{k5}, ymm13, [rbx]{1to8} vpmaxud ymm16{k5}, ymm13, [rbx+r11*8+256] vpmaxud ymm16{k5}, ymm13, [rbx+r11*8-256] vpmaxud ymm16{k5}{z}, ymm13, ymm15 vpmaxud ymm16{k5}{z}, ymm13, [rbx] vpmaxud ymm16{k5}{z}, ymm13, [rbx]{1to8} vpmaxud ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmaxud ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmaxud zmm24, zmm24, zmm31 vpmaxud zmm24, zmm24, [rbx] vpmaxud zmm24, zmm24, [rbx]{1to16} vpmaxud zmm24, zmm24, [rbx+r11*8+256] vpmaxud zmm24, zmm24, [rbx+r11*8-256] vpmaxud zmm24{k5}, zmm24, zmm31 vpmaxud zmm24{k5}, zmm24, [rbx] vpmaxud zmm24{k5}, zmm24, [rbx]{1to16} vpmaxud zmm24{k5}, zmm24, [rbx+r11*8+256] vpmaxud zmm24{k5}, zmm24, [rbx+r11*8-256] vpmaxud zmm24{k5}{z}, zmm24, zmm31 vpmaxud zmm24{k5}{z}, zmm24, [rbx] vpmaxud zmm24{k5}{z}, zmm24, [rbx]{1to16} vpmaxud zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmaxud zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmaxuq xmm2, xmm7, xmm0 vpmaxuq xmm2, xmm7, [rbx] vpmaxuq xmm2, xmm7, [rbx]{1to2} vpmaxuq xmm2, xmm7, [rbx+r11*8+256] vpmaxuq xmm2, xmm7, [rbx+r11*8-256] vpmaxuq xmm2{k5}, xmm7, xmm0 vpmaxuq xmm2{k5}, xmm7, [rbx] vpmaxuq xmm2{k5}, xmm7, [rbx]{1to2} vpmaxuq xmm2{k5}, xmm7, [rbx+r11*8+256] vpmaxuq xmm2{k5}, xmm7, [rbx+r11*8-256] vpmaxuq xmm2{k5}{z}, xmm7, xmm0 vpmaxuq xmm2{k5}{z}, xmm7, [rbx] vpmaxuq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpmaxuq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmaxuq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmaxuq ymm16, ymm13, ymm15 vpmaxuq ymm16, ymm13, [rbx] vpmaxuq ymm16, ymm13, [rbx]{1to4} vpmaxuq ymm16, ymm13, [rbx+r11*8+256] vpmaxuq ymm16, ymm13, [rbx+r11*8-256] vpmaxuq ymm16{k5}, ymm13, ymm15 vpmaxuq ymm16{k5}, ymm13, [rbx] vpmaxuq ymm16{k5}, ymm13, [rbx]{1to4} vpmaxuq ymm16{k5}, ymm13, [rbx+r11*8+256] vpmaxuq ymm16{k5}, ymm13, [rbx+r11*8-256] vpmaxuq ymm16{k5}{z}, ymm13, ymm15 vpmaxuq ymm16{k5}{z}, ymm13, [rbx] vpmaxuq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpmaxuq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmaxuq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmaxuq zmm24, zmm24, zmm31 vpmaxuq zmm24, zmm24, [rbx] vpmaxuq zmm24, zmm24, [rbx]{1to8} vpmaxuq zmm24, zmm24, [rbx+r11*8+256] vpmaxuq zmm24, zmm24, [rbx+r11*8-256] vpmaxuq zmm24{k5}, zmm24, zmm31 vpmaxuq zmm24{k5}, zmm24, [rbx] vpmaxuq zmm24{k5}, zmm24, [rbx]{1to8} vpmaxuq zmm24{k5}, zmm24, [rbx+r11*8+256] vpmaxuq zmm24{k5}, zmm24, [rbx+r11*8-256] vpmaxuq zmm24{k5}{z}, zmm24, zmm31 vpmaxuq zmm24{k5}{z}, zmm24, [rbx] vpmaxuq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpmaxuq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmaxuq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpminsd xmm2, xmm7, xmm0 vpminsd xmm2, xmm7, [rbx] vpminsd xmm2, xmm7, [rbx]{1to4} vpminsd xmm2, xmm7, [rbx+r11*8+256] vpminsd xmm2, xmm7, [rbx+r11*8-256] vpminsd xmm2{k5}, xmm7, xmm0 vpminsd xmm2{k5}, xmm7, [rbx] vpminsd xmm2{k5}, xmm7, [rbx]{1to4} vpminsd xmm2{k5}, xmm7, [rbx+r11*8+256] vpminsd xmm2{k5}, xmm7, [rbx+r11*8-256] vpminsd xmm2{k5}{z}, xmm7, xmm0 vpminsd xmm2{k5}{z}, xmm7, [rbx] vpminsd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpminsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpminsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpminsd ymm16, ymm13, ymm15 vpminsd ymm16, ymm13, [rbx] vpminsd ymm16, ymm13, [rbx]{1to8} vpminsd ymm16, ymm13, [rbx+r11*8+256] vpminsd ymm16, ymm13, [rbx+r11*8-256] vpminsd ymm16{k5}, ymm13, ymm15 vpminsd ymm16{k5}, ymm13, [rbx] vpminsd ymm16{k5}, ymm13, [rbx]{1to8} vpminsd ymm16{k5}, ymm13, [rbx+r11*8+256] vpminsd ymm16{k5}, ymm13, [rbx+r11*8-256] vpminsd ymm16{k5}{z}, ymm13, ymm15 vpminsd ymm16{k5}{z}, ymm13, [rbx] vpminsd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpminsd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpminsd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpminsd zmm24, zmm24, zmm31 vpminsd zmm24, zmm24, [rbx] vpminsd zmm24, zmm24, [rbx]{1to16} vpminsd zmm24, zmm24, [rbx+r11*8+256] vpminsd zmm24, zmm24, [rbx+r11*8-256] vpminsd zmm24{k5}, zmm24, zmm31 vpminsd zmm24{k5}, zmm24, [rbx] vpminsd zmm24{k5}, zmm24, [rbx]{1to16} vpminsd zmm24{k5}, zmm24, [rbx+r11*8+256] vpminsd zmm24{k5}, zmm24, [rbx+r11*8-256] vpminsd zmm24{k5}{z}, zmm24, zmm31 vpminsd zmm24{k5}{z}, zmm24, [rbx] vpminsd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpminsd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpminsd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpminsq xmm2, xmm7, xmm0 vpminsq xmm2, xmm7, [rbx] vpminsq xmm2, xmm7, [rbx]{1to2} vpminsq xmm2, xmm7, [rbx+r11*8+256] vpminsq xmm2, xmm7, [rbx+r11*8-256] vpminsq xmm2{k5}, xmm7, xmm0 vpminsq xmm2{k5}, xmm7, [rbx] vpminsq xmm2{k5}, xmm7, [rbx]{1to2} vpminsq xmm2{k5}, xmm7, [rbx+r11*8+256] vpminsq xmm2{k5}, xmm7, [rbx+r11*8-256] vpminsq xmm2{k5}{z}, xmm7, xmm0 vpminsq xmm2{k5}{z}, xmm7, [rbx] vpminsq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpminsq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpminsq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpminsq ymm16, ymm13, ymm15 vpminsq ymm16, ymm13, [rbx] vpminsq ymm16, ymm13, [rbx]{1to4} vpminsq ymm16, ymm13, [rbx+r11*8+256] vpminsq ymm16, ymm13, [rbx+r11*8-256] vpminsq ymm16{k5}, ymm13, ymm15 vpminsq ymm16{k5}, ymm13, [rbx] vpminsq ymm16{k5}, ymm13, [rbx]{1to4} vpminsq ymm16{k5}, ymm13, [rbx+r11*8+256] vpminsq ymm16{k5}, ymm13, [rbx+r11*8-256] vpminsq ymm16{k5}{z}, ymm13, ymm15 vpminsq ymm16{k5}{z}, ymm13, [rbx] vpminsq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpminsq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpminsq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpminsq zmm24, zmm24, zmm31 vpminsq zmm24, zmm24, [rbx] vpminsq zmm24, zmm24, [rbx]{1to8} vpminsq zmm24, zmm24, [rbx+r11*8+256] vpminsq zmm24, zmm24, [rbx+r11*8-256] vpminsq zmm24{k5}, zmm24, zmm31 vpminsq zmm24{k5}, zmm24, [rbx] vpminsq zmm24{k5}, zmm24, [rbx]{1to8} vpminsq zmm24{k5}, zmm24, [rbx+r11*8+256] vpminsq zmm24{k5}, zmm24, [rbx+r11*8-256] vpminsq zmm24{k5}{z}, zmm24, zmm31 vpminsq zmm24{k5}{z}, zmm24, [rbx] vpminsq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpminsq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpminsq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpminud xmm2, xmm7, xmm0 vpminud xmm2, xmm7, [rbx] vpminud xmm2, xmm7, [rbx]{1to4} vpminud xmm2, xmm7, [rbx+r11*8+256] vpminud xmm2, xmm7, [rbx+r11*8-256] vpminud xmm2{k5}, xmm7, xmm0 vpminud xmm2{k5}, xmm7, [rbx] vpminud xmm2{k5}, xmm7, [rbx]{1to4} vpminud xmm2{k5}, xmm7, [rbx+r11*8+256] vpminud xmm2{k5}, xmm7, [rbx+r11*8-256] vpminud xmm2{k5}{z}, xmm7, xmm0 vpminud xmm2{k5}{z}, xmm7, [rbx] vpminud xmm2{k5}{z}, xmm7, [rbx]{1to4} vpminud xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpminud xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpminud ymm16, ymm13, ymm15 vpminud ymm16, ymm13, [rbx] vpminud ymm16, ymm13, [rbx]{1to8} vpminud ymm16, ymm13, [rbx+r11*8+256] vpminud ymm16, ymm13, [rbx+r11*8-256] vpminud ymm16{k5}, ymm13, ymm15 vpminud ymm16{k5}, ymm13, [rbx] vpminud ymm16{k5}, ymm13, [rbx]{1to8} vpminud ymm16{k5}, ymm13, [rbx+r11*8+256] vpminud ymm16{k5}, ymm13, [rbx+r11*8-256] vpminud ymm16{k5}{z}, ymm13, ymm15 vpminud ymm16{k5}{z}, ymm13, [rbx] vpminud ymm16{k5}{z}, ymm13, [rbx]{1to8} vpminud ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpminud ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpminud zmm24, zmm24, zmm31 vpminud zmm24, zmm24, [rbx] vpminud zmm24, zmm24, [rbx]{1to16} vpminud zmm24, zmm24, [rbx+r11*8+256] vpminud zmm24, zmm24, [rbx+r11*8-256] vpminud zmm24{k5}, zmm24, zmm31 vpminud zmm24{k5}, zmm24, [rbx] vpminud zmm24{k5}, zmm24, [rbx]{1to16} vpminud zmm24{k5}, zmm24, [rbx+r11*8+256] vpminud zmm24{k5}, zmm24, [rbx+r11*8-256] vpminud zmm24{k5}{z}, zmm24, zmm31 vpminud zmm24{k5}{z}, zmm24, [rbx] vpminud zmm24{k5}{z}, zmm24, [rbx]{1to16} vpminud zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpminud zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpminuq xmm2, xmm7, xmm0 vpminuq xmm2, xmm7, [rbx] vpminuq xmm2, xmm7, [rbx]{1to2} vpminuq xmm2, xmm7, [rbx+r11*8+256] vpminuq xmm2, xmm7, [rbx+r11*8-256] vpminuq xmm2{k5}, xmm7, xmm0 vpminuq xmm2{k5}, xmm7, [rbx] vpminuq xmm2{k5}, xmm7, [rbx]{1to2} vpminuq xmm2{k5}, xmm7, [rbx+r11*8+256] vpminuq xmm2{k5}, xmm7, [rbx+r11*8-256] vpminuq xmm2{k5}{z}, xmm7, xmm0 vpminuq xmm2{k5}{z}, xmm7, [rbx] vpminuq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpminuq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpminuq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpminuq ymm16, ymm13, ymm15 vpminuq ymm16, ymm13, [rbx] vpminuq ymm16, ymm13, [rbx]{1to4} vpminuq ymm16, ymm13, [rbx+r11*8+256] vpminuq ymm16, ymm13, [rbx+r11*8-256] vpminuq ymm16{k5}, ymm13, ymm15 vpminuq ymm16{k5}, ymm13, [rbx] vpminuq ymm16{k5}, ymm13, [rbx]{1to4} vpminuq ymm16{k5}, ymm13, [rbx+r11*8+256] vpminuq ymm16{k5}, ymm13, [rbx+r11*8-256] vpminuq ymm16{k5}{z}, ymm13, ymm15 vpminuq ymm16{k5}{z}, ymm13, [rbx] vpminuq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpminuq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpminuq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpminuq zmm24, zmm24, zmm31 vpminuq zmm24, zmm24, [rbx] vpminuq zmm24, zmm24, [rbx]{1to8} vpminuq zmm24, zmm24, [rbx+r11*8+256] vpminuq zmm24, zmm24, [rbx+r11*8-256] vpminuq zmm24{k5}, zmm24, zmm31 vpminuq zmm24{k5}, zmm24, [rbx] vpminuq zmm24{k5}, zmm24, [rbx]{1to8} vpminuq zmm24{k5}, zmm24, [rbx+r11*8+256] vpminuq zmm24{k5}, zmm24, [rbx+r11*8-256] vpminuq zmm24{k5}{z}, zmm24, zmm31 vpminuq zmm24{k5}{z}, zmm24, [rbx] vpminuq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpminuq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpminuq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmovdb xmm0, xmm2 vpmovdb xmm0, ymm16 vpmovdb xmm0, zmm24 vpmovdb [rbx], xmm2 vpmovdb [rbx], ymm16 vpmovdb [rbx], zmm24 vpmovdb [rbx+r11*8+256], xmm2 vpmovdb [rbx+r11*8+256], ymm16 vpmovdb [rbx+r11*8+256], zmm24 vpmovdb [rbx+r11*8-256], xmm2 vpmovdb [rbx+r11*8-256], ymm16 vpmovdb [rbx+r11*8-256], zmm24 vpmovdw xmm0, xmm2 vpmovdw xmm0, ymm16 vpmovdw ymm15, zmm24 vpmovdw [rbx], xmm2 vpmovdw [rbx], ymm16 vpmovdw [rbx], zmm24 vpmovdw [rbx+r11*8+256], xmm2 vpmovdw [rbx+r11*8+256], ymm16 vpmovdw [rbx+r11*8+256], zmm24 vpmovdw [rbx+r11*8-256], xmm2 vpmovdw [rbx+r11*8-256], ymm16 vpmovdw [rbx+r11*8-256], zmm24 vpmovqb xmm0, xmm2 vpmovqb xmm0, ymm16 vpmovqb xmm0, zmm24 vpmovqb [rbx], xmm2 vpmovqb [rbx], ymm16 vpmovqb [rbx], zmm24 vpmovqb [rbx+r11*8+256], xmm2 vpmovqb [rbx+r11*8+256], ymm16 vpmovqb [rbx+r11*8+256], zmm24 vpmovqb [rbx+r11*8-256], xmm2 vpmovqb [rbx+r11*8-256], ymm16 vpmovqb [rbx+r11*8-256], zmm24 vpmovqd xmm0, xmm2 vpmovqd xmm0, ymm16 vpmovqd ymm15, zmm24 vpmovqd [rbx], xmm2 vpmovqd [rbx], ymm16 vpmovqd [rbx], zmm24 vpmovqd [rbx+r11*8+256], xmm2 vpmovqd [rbx+r11*8+256], ymm16 vpmovqd [rbx+r11*8+256], zmm24 vpmovqd [rbx+r11*8-256], xmm2 vpmovqd [rbx+r11*8-256], ymm16 vpmovqd [rbx+r11*8-256], zmm24 vpmovqw xmm0, xmm2 vpmovqw xmm0, ymm16 vpmovqw xmm0, zmm24 vpmovqw [rbx], xmm2 vpmovqw [rbx], ymm16 vpmovqw [rbx], zmm24 vpmovqw [rbx+r11*8+256], xmm2 vpmovqw [rbx+r11*8+256], ymm16 vpmovqw [rbx+r11*8+256], zmm24 vpmovqw [rbx+r11*8-256], xmm2 vpmovqw [rbx+r11*8-256], ymm16 vpmovqw [rbx+r11*8-256], zmm24 vpmovsdb xmm0, xmm2 vpmovsdb xmm0, ymm16 vpmovsdb xmm0, zmm24 vpmovsdb [rbx], xmm2 vpmovsdb [rbx], ymm16 vpmovsdb [rbx], zmm24 vpmovsdb [rbx+r11*8+256], xmm2 vpmovsdb [rbx+r11*8+256], ymm16 vpmovsdb [rbx+r11*8+256], zmm24 vpmovsdb [rbx+r11*8-256], xmm2 vpmovsdb [rbx+r11*8-256], ymm16 vpmovsdb [rbx+r11*8-256], zmm24 vpmovsdw xmm0, xmm2 vpmovsdw xmm0, ymm16 vpmovsdw ymm15, zmm24 vpmovsdw [rbx], xmm2 vpmovsdw [rbx], ymm16 vpmovsdw [rbx], zmm24 vpmovsdw [rbx+r11*8+256], xmm2 vpmovsdw [rbx+r11*8+256], ymm16 vpmovsdw [rbx+r11*8+256], zmm24 vpmovsdw [rbx+r11*8-256], xmm2 vpmovsdw [rbx+r11*8-256], ymm16 vpmovsdw [rbx+r11*8-256], zmm24 vpmovsqb xmm0, xmm2 vpmovsqb xmm0, ymm16 vpmovsqb xmm0, zmm24 vpmovsqb [rbx], xmm2 vpmovsqb [rbx], ymm16 vpmovsqb [rbx], zmm24 vpmovsqb [rbx+r11*8+256], xmm2 vpmovsqb [rbx+r11*8+256], ymm16 vpmovsqb [rbx+r11*8+256], zmm24 vpmovsqb [rbx+r11*8-256], xmm2 vpmovsqb [rbx+r11*8-256], ymm16 vpmovsqb [rbx+r11*8-256], zmm24 vpmovsqd xmm0, xmm2 vpmovsqd xmm0, ymm16 vpmovsqd ymm15, zmm24 vpmovsqd [rbx], xmm2 vpmovsqd [rbx], ymm16 vpmovsqd [rbx], zmm24 vpmovsqd [rbx+r11*8+256], xmm2 vpmovsqd [rbx+r11*8+256], ymm16 vpmovsqd [rbx+r11*8+256], zmm24 vpmovsqd [rbx+r11*8-256], xmm2 vpmovsqd [rbx+r11*8-256], ymm16 vpmovsqd [rbx+r11*8-256], zmm24 vpmovsqw xmm0, xmm2 vpmovsqw xmm0, ymm16 vpmovsqw xmm0, zmm24 vpmovsqw [rbx], xmm2 vpmovsqw [rbx], ymm16 vpmovsqw [rbx], zmm24 vpmovsqw [rbx+r11*8+256], xmm2 vpmovsqw [rbx+r11*8+256], ymm16 vpmovsqw [rbx+r11*8+256], zmm24 vpmovsqw [rbx+r11*8-256], xmm2 vpmovsqw [rbx+r11*8-256], ymm16 vpmovsqw [rbx+r11*8-256], zmm24 vpmovsxbd xmm2, xmm0 vpmovsxbd xmm2, [rbx] vpmovsxbd xmm2, [rbx+r11*8+256] vpmovsxbd xmm2, [rbx+r11*8-256] vpmovsxbd xmm2{k5}, xmm0 vpmovsxbd xmm2{k5}, [rbx] vpmovsxbd xmm2{k5}, [rbx+r11*8+256] vpmovsxbd xmm2{k5}, [rbx+r11*8-256] vpmovsxbd xmm2{k5}{z}, xmm0 vpmovsxbd xmm2{k5}{z}, [rbx] vpmovsxbd xmm2{k5}{z}, [rbx+r11*8+256] vpmovsxbd xmm2{k5}{z}, [rbx+r11*8-256] vpmovsxbd ymm16, xmm0 vpmovsxbd ymm16, [rbx] vpmovsxbd ymm16, [rbx+r11*8+256] vpmovsxbd ymm16, [rbx+r11*8-256] vpmovsxbd ymm16{k5}, xmm0 vpmovsxbd ymm16{k5}, [rbx] vpmovsxbd ymm16{k5}, [rbx+r11*8+256] vpmovsxbd ymm16{k5}, [rbx+r11*8-256] vpmovsxbd ymm16{k5}{z}, xmm0 vpmovsxbd ymm16{k5}{z}, [rbx] vpmovsxbd ymm16{k5}{z}, [rbx+r11*8+256] vpmovsxbd ymm16{k5}{z}, [rbx+r11*8-256] vpmovsxbd zmm24, xmm0 vpmovsxbd zmm24, [rbx] vpmovsxbd zmm24, [rbx+r11*8+256] vpmovsxbd zmm24, [rbx+r11*8-256] vpmovsxbd zmm24{k5}, xmm0 vpmovsxbd zmm24{k5}, [rbx] vpmovsxbd zmm24{k5}, [rbx+r11*8+256] vpmovsxbd zmm24{k5}, [rbx+r11*8-256] vpmovsxbd zmm24{k5}{z}, xmm0 vpmovsxbd zmm24{k5}{z}, [rbx] vpmovsxbd zmm24{k5}{z}, [rbx+r11*8+256] vpmovsxbd zmm24{k5}{z}, [rbx+r11*8-256] vpmovsxbq xmm2, xmm0 vpmovsxbq xmm2, [rbx] vpmovsxbq xmm2, [rbx+r11*8+256] vpmovsxbq xmm2, [rbx+r11*8-256] vpmovsxbq xmm2{k5}, xmm0 vpmovsxbq xmm2{k5}, [rbx] vpmovsxbq xmm2{k5}, [rbx+r11*8+256] vpmovsxbq xmm2{k5}, [rbx+r11*8-256] vpmovsxbq xmm2{k5}{z}, xmm0 vpmovsxbq xmm2{k5}{z}, [rbx] vpmovsxbq xmm2{k5}{z}, [rbx+r11*8+256] vpmovsxbq xmm2{k5}{z}, [rbx+r11*8-256] vpmovsxbq ymm16, xmm0 vpmovsxbq ymm16, [rbx] vpmovsxbq ymm16, [rbx+r11*8+256] vpmovsxbq ymm16, [rbx+r11*8-256] vpmovsxbq ymm16{k5}, xmm0 vpmovsxbq ymm16{k5}, [rbx] vpmovsxbq ymm16{k5}, [rbx+r11*8+256] vpmovsxbq ymm16{k5}, [rbx+r11*8-256] vpmovsxbq ymm16{k5}{z}, xmm0 vpmovsxbq ymm16{k5}{z}, [rbx] vpmovsxbq ymm16{k5}{z}, [rbx+r11*8+256] vpmovsxbq ymm16{k5}{z}, [rbx+r11*8-256] vpmovsxbq zmm24, xmm0 vpmovsxbq zmm24, [rbx] vpmovsxbq zmm24, [rbx+r11*8+256] vpmovsxbq zmm24, [rbx+r11*8-256] vpmovsxbq zmm24{k5}, xmm0 vpmovsxbq zmm24{k5}, [rbx] vpmovsxbq zmm24{k5}, [rbx+r11*8+256] vpmovsxbq zmm24{k5}, [rbx+r11*8-256] vpmovsxbq zmm24{k5}{z}, xmm0 vpmovsxbq zmm24{k5}{z}, [rbx] vpmovsxbq zmm24{k5}{z}, [rbx+r11*8+256] vpmovsxbq zmm24{k5}{z}, [rbx+r11*8-256] vpmovsxdq xmm2, xmm0 vpmovsxdq xmm2, [rbx] vpmovsxdq xmm2, [rbx+r11*8+256] vpmovsxdq xmm2, [rbx+r11*8-256] vpmovsxdq xmm2{k5}, xmm0 vpmovsxdq xmm2{k5}, [rbx] vpmovsxdq xmm2{k5}, [rbx+r11*8+256] vpmovsxdq xmm2{k5}, [rbx+r11*8-256] vpmovsxdq xmm2{k5}{z}, xmm0 vpmovsxdq xmm2{k5}{z}, [rbx] vpmovsxdq xmm2{k5}{z}, [rbx+r11*8+256] vpmovsxdq xmm2{k5}{z}, [rbx+r11*8-256] vpmovsxdq ymm16, xmm0 vpmovsxdq ymm16, [rbx] vpmovsxdq ymm16, [rbx+r11*8+256] vpmovsxdq ymm16, [rbx+r11*8-256] vpmovsxdq ymm16{k5}, xmm0 vpmovsxdq ymm16{k5}, [rbx] vpmovsxdq ymm16{k5}, [rbx+r11*8+256] vpmovsxdq ymm16{k5}, [rbx+r11*8-256] vpmovsxdq ymm16{k5}{z}, xmm0 vpmovsxdq ymm16{k5}{z}, [rbx] vpmovsxdq ymm16{k5}{z}, [rbx+r11*8+256] vpmovsxdq ymm16{k5}{z}, [rbx+r11*8-256] vpmovsxdq zmm24, ymm15 vpmovsxdq zmm24, [rbx] vpmovsxdq zmm24, [rbx+r11*8+256] vpmovsxdq zmm24, [rbx+r11*8-256] vpmovsxdq zmm24{k5}, ymm15 vpmovsxdq zmm24{k5}, [rbx] vpmovsxdq zmm24{k5}, [rbx+r11*8+256] vpmovsxdq zmm24{k5}, [rbx+r11*8-256] vpmovsxdq zmm24{k5}{z}, ymm15 vpmovsxdq zmm24{k5}{z}, [rbx] vpmovsxdq zmm24{k5}{z}, [rbx+r11*8+256] vpmovsxdq zmm24{k5}{z}, [rbx+r11*8-256] vpmovsxwd xmm2, xmm0 vpmovsxwd xmm2, [rbx] vpmovsxwd xmm2, [rbx+r11*8+256] vpmovsxwd xmm2, [rbx+r11*8-256] vpmovsxwd xmm2{k5}, xmm0 vpmovsxwd xmm2{k5}, [rbx] vpmovsxwd xmm2{k5}, [rbx+r11*8+256] vpmovsxwd xmm2{k5}, [rbx+r11*8-256] vpmovsxwd xmm2{k5}{z}, xmm0 vpmovsxwd xmm2{k5}{z}, [rbx] vpmovsxwd xmm2{k5}{z}, [rbx+r11*8+256] vpmovsxwd xmm2{k5}{z}, [rbx+r11*8-256] vpmovsxwd ymm16, xmm0 vpmovsxwd ymm16, [rbx] vpmovsxwd ymm16, [rbx+r11*8+256] vpmovsxwd ymm16, [rbx+r11*8-256] vpmovsxwd ymm16{k5}, xmm0 vpmovsxwd ymm16{k5}, [rbx] vpmovsxwd ymm16{k5}, [rbx+r11*8+256] vpmovsxwd ymm16{k5}, [rbx+r11*8-256] vpmovsxwd ymm16{k5}{z}, xmm0 vpmovsxwd ymm16{k5}{z}, [rbx] vpmovsxwd ymm16{k5}{z}, [rbx+r11*8+256] vpmovsxwd ymm16{k5}{z}, [rbx+r11*8-256] vpmovsxwd zmm24, ymm15 vpmovsxwd zmm24, [rbx] vpmovsxwd zmm24, [rbx+r11*8+256] vpmovsxwd zmm24, [rbx+r11*8-256] vpmovsxwd zmm24{k5}, ymm15 vpmovsxwd zmm24{k5}, [rbx] vpmovsxwd zmm24{k5}, [rbx+r11*8+256] vpmovsxwd zmm24{k5}, [rbx+r11*8-256] vpmovsxwd zmm24{k5}{z}, ymm15 vpmovsxwd zmm24{k5}{z}, [rbx] vpmovsxwd zmm24{k5}{z}, [rbx+r11*8+256] vpmovsxwd zmm24{k5}{z}, [rbx+r11*8-256] vpmovsxwq xmm2, xmm0 vpmovsxwq xmm2, [rbx] vpmovsxwq xmm2, [rbx+r11*8+256] vpmovsxwq xmm2, [rbx+r11*8-256] vpmovsxwq xmm2{k5}, xmm0 vpmovsxwq xmm2{k5}, [rbx] vpmovsxwq xmm2{k5}, [rbx+r11*8+256] vpmovsxwq xmm2{k5}, [rbx+r11*8-256] vpmovsxwq xmm2{k5}{z}, xmm0 vpmovsxwq xmm2{k5}{z}, [rbx] vpmovsxwq xmm2{k5}{z}, [rbx+r11*8+256] vpmovsxwq xmm2{k5}{z}, [rbx+r11*8-256] vpmovsxwq ymm16, xmm0 vpmovsxwq ymm16, [rbx] vpmovsxwq ymm16, [rbx+r11*8+256] vpmovsxwq ymm16, [rbx+r11*8-256] vpmovsxwq ymm16{k5}, xmm0 vpmovsxwq ymm16{k5}, [rbx] vpmovsxwq ymm16{k5}, [rbx+r11*8+256] vpmovsxwq ymm16{k5}, [rbx+r11*8-256] vpmovsxwq ymm16{k5}{z}, xmm0 vpmovsxwq ymm16{k5}{z}, [rbx] vpmovsxwq ymm16{k5}{z}, [rbx+r11*8+256] vpmovsxwq ymm16{k5}{z}, [rbx+r11*8-256] vpmovsxwq zmm24, xmm0 vpmovsxwq zmm24, [rbx] vpmovsxwq zmm24, [rbx+r11*8+256] vpmovsxwq zmm24, [rbx+r11*8-256] vpmovsxwq zmm24{k5}, xmm0 vpmovsxwq zmm24{k5}, [rbx] vpmovsxwq zmm24{k5}, [rbx+r11*8+256] vpmovsxwq zmm24{k5}, [rbx+r11*8-256] vpmovsxwq zmm24{k5}{z}, xmm0 vpmovsxwq zmm24{k5}{z}, [rbx] vpmovsxwq zmm24{k5}{z}, [rbx+r11*8+256] vpmovsxwq zmm24{k5}{z}, [rbx+r11*8-256] vpmovusdb xmm0, xmm2 vpmovusdb xmm0, ymm16 vpmovusdb xmm0, zmm24 vpmovusdb [rbx], xmm2 vpmovusdb [rbx], ymm16 vpmovusdb [rbx], zmm24 vpmovusdb [rbx+r11*8+256], xmm2 vpmovusdb [rbx+r11*8+256], ymm16 vpmovusdb [rbx+r11*8+256], zmm24 vpmovusdb [rbx+r11*8-256], xmm2 vpmovusdb [rbx+r11*8-256], ymm16 vpmovusdb [rbx+r11*8-256], zmm24 vpmovusdw xmm0, xmm2 vpmovusdw xmm0, ymm16 vpmovusdw ymm15, zmm24 vpmovusdw [rbx], xmm2 vpmovusdw [rbx], ymm16 vpmovusdw [rbx], zmm24 vpmovusdw [rbx+r11*8+256], xmm2 vpmovusdw [rbx+r11*8+256], ymm16 vpmovusdw [rbx+r11*8+256], zmm24 vpmovusdw [rbx+r11*8-256], xmm2 vpmovusdw [rbx+r11*8-256], ymm16 vpmovusdw [rbx+r11*8-256], zmm24 vpmovusqb xmm0, xmm2 vpmovusqb xmm0, ymm16 vpmovusqb xmm0, zmm24 vpmovusqb [rbx], xmm2 vpmovusqb [rbx], ymm16 vpmovusqb [rbx], zmm24 vpmovusqb [rbx+r11*8+256], xmm2 vpmovusqb [rbx+r11*8+256], ymm16 vpmovusqb [rbx+r11*8+256], zmm24 vpmovusqb [rbx+r11*8-256], xmm2 vpmovusqb [rbx+r11*8-256], ymm16 vpmovusqb [rbx+r11*8-256], zmm24 vpmovusqd xmm0, xmm2 vpmovusqd xmm0, ymm16 vpmovusqd ymm15, zmm24 vpmovusqd [rbx], xmm2 vpmovusqd [rbx], ymm16 vpmovusqd [rbx], zmm24 vpmovusqd [rbx+r11*8+256], xmm2 vpmovusqd [rbx+r11*8+256], ymm16 vpmovusqd [rbx+r11*8+256], zmm24 vpmovusqd [rbx+r11*8-256], xmm2 vpmovusqd [rbx+r11*8-256], ymm16 vpmovusqd [rbx+r11*8-256], zmm24 vpmovusqw xmm0, xmm2 vpmovusqw xmm0, ymm16 vpmovusqw xmm0, zmm24 vpmovusqw [rbx], xmm2 vpmovusqw [rbx], ymm16 vpmovusqw [rbx], zmm24 vpmovusqw [rbx+r11*8+256], xmm2 vpmovusqw [rbx+r11*8+256], ymm16 vpmovusqw [rbx+r11*8+256], zmm24 vpmovusqw [rbx+r11*8-256], xmm2 vpmovusqw [rbx+r11*8-256], ymm16 vpmovusqw [rbx+r11*8-256], zmm24 vpmovzxbd xmm2, xmm0 vpmovzxbd xmm2, [rbx] vpmovzxbd xmm2, [rbx+r11*8+256] vpmovzxbd xmm2, [rbx+r11*8-256] vpmovzxbd xmm2{k5}, xmm0 vpmovzxbd xmm2{k5}, [rbx] vpmovzxbd xmm2{k5}, [rbx+r11*8+256] vpmovzxbd xmm2{k5}, [rbx+r11*8-256] vpmovzxbd xmm2{k5}{z}, xmm0 vpmovzxbd xmm2{k5}{z}, [rbx] vpmovzxbd xmm2{k5}{z}, [rbx+r11*8+256] vpmovzxbd xmm2{k5}{z}, [rbx+r11*8-256] vpmovzxbd ymm16, xmm0 vpmovzxbd ymm16, [rbx] vpmovzxbd ymm16, [rbx+r11*8+256] vpmovzxbd ymm16, [rbx+r11*8-256] vpmovzxbd ymm16{k5}, xmm0 vpmovzxbd ymm16{k5}, [rbx] vpmovzxbd ymm16{k5}, [rbx+r11*8+256] vpmovzxbd ymm16{k5}, [rbx+r11*8-256] vpmovzxbd ymm16{k5}{z}, xmm0 vpmovzxbd ymm16{k5}{z}, [rbx] vpmovzxbd ymm16{k5}{z}, [rbx+r11*8+256] vpmovzxbd ymm16{k5}{z}, [rbx+r11*8-256] vpmovzxbd zmm24, xmm0 vpmovzxbd zmm24, [rbx] vpmovzxbd zmm24, [rbx+r11*8+256] vpmovzxbd zmm24, [rbx+r11*8-256] vpmovzxbd zmm24{k5}, xmm0 vpmovzxbd zmm24{k5}, [rbx] vpmovzxbd zmm24{k5}, [rbx+r11*8+256] vpmovzxbd zmm24{k5}, [rbx+r11*8-256] vpmovzxbd zmm24{k5}{z}, xmm0 vpmovzxbd zmm24{k5}{z}, [rbx] vpmovzxbd zmm24{k5}{z}, [rbx+r11*8+256] vpmovzxbd zmm24{k5}{z}, [rbx+r11*8-256] vpmovzxbq xmm2, xmm0 vpmovzxbq xmm2, [rbx] vpmovzxbq xmm2, [rbx+r11*8+256] vpmovzxbq xmm2, [rbx+r11*8-256] vpmovzxbq xmm2{k5}, xmm0 vpmovzxbq xmm2{k5}, [rbx] vpmovzxbq xmm2{k5}, [rbx+r11*8+256] vpmovzxbq xmm2{k5}, [rbx+r11*8-256] vpmovzxbq xmm2{k5}{z}, xmm0 vpmovzxbq xmm2{k5}{z}, [rbx] vpmovzxbq xmm2{k5}{z}, [rbx+r11*8+256] vpmovzxbq xmm2{k5}{z}, [rbx+r11*8-256] vpmovzxbq ymm16, xmm0 vpmovzxbq ymm16, [rbx] vpmovzxbq ymm16, [rbx+r11*8+256] vpmovzxbq ymm16, [rbx+r11*8-256] vpmovzxbq ymm16{k5}, xmm0 vpmovzxbq ymm16{k5}, [rbx] vpmovzxbq ymm16{k5}, [rbx+r11*8+256] vpmovzxbq ymm16{k5}, [rbx+r11*8-256] vpmovzxbq ymm16{k5}{z}, xmm0 vpmovzxbq ymm16{k5}{z}, [rbx] vpmovzxbq ymm16{k5}{z}, [rbx+r11*8+256] vpmovzxbq ymm16{k5}{z}, [rbx+r11*8-256] vpmovzxbq zmm24, xmm0 vpmovzxbq zmm24, [rbx] vpmovzxbq zmm24, [rbx+r11*8+256] vpmovzxbq zmm24, [rbx+r11*8-256] vpmovzxbq zmm24{k5}, xmm0 vpmovzxbq zmm24{k5}, [rbx] vpmovzxbq zmm24{k5}, [rbx+r11*8+256] vpmovzxbq zmm24{k5}, [rbx+r11*8-256] vpmovzxbq zmm24{k5}{z}, xmm0 vpmovzxbq zmm24{k5}{z}, [rbx] vpmovzxbq zmm24{k5}{z}, [rbx+r11*8+256] vpmovzxbq zmm24{k5}{z}, [rbx+r11*8-256] vpmovzxdq xmm2, xmm0 vpmovzxdq xmm2, [rbx] vpmovzxdq xmm2, [rbx+r11*8+256] vpmovzxdq xmm2, [rbx+r11*8-256] vpmovzxdq xmm2{k5}, xmm0 vpmovzxdq xmm2{k5}, [rbx] vpmovzxdq xmm2{k5}, [rbx+r11*8+256] vpmovzxdq xmm2{k5}, [rbx+r11*8-256] vpmovzxdq xmm2{k5}{z}, xmm0 vpmovzxdq xmm2{k5}{z}, [rbx] vpmovzxdq xmm2{k5}{z}, [rbx+r11*8+256] vpmovzxdq xmm2{k5}{z}, [rbx+r11*8-256] vpmovzxdq ymm16, xmm0 vpmovzxdq ymm16, [rbx] vpmovzxdq ymm16, [rbx+r11*8+256] vpmovzxdq ymm16, [rbx+r11*8-256] vpmovzxdq ymm16{k5}, xmm0 vpmovzxdq ymm16{k5}, [rbx] vpmovzxdq ymm16{k5}, [rbx+r11*8+256] vpmovzxdq ymm16{k5}, [rbx+r11*8-256] vpmovzxdq ymm16{k5}{z}, xmm0 vpmovzxdq ymm16{k5}{z}, [rbx] vpmovzxdq ymm16{k5}{z}, [rbx+r11*8+256] vpmovzxdq ymm16{k5}{z}, [rbx+r11*8-256] vpmovzxdq zmm24, ymm15 vpmovzxdq zmm24, [rbx] vpmovzxdq zmm24, [rbx+r11*8+256] vpmovzxdq zmm24, [rbx+r11*8-256] vpmovzxdq zmm24{k5}, ymm15 vpmovzxdq zmm24{k5}, [rbx] vpmovzxdq zmm24{k5}, [rbx+r11*8+256] vpmovzxdq zmm24{k5}, [rbx+r11*8-256] vpmovzxdq zmm24{k5}{z}, ymm15 vpmovzxdq zmm24{k5}{z}, [rbx] vpmovzxdq zmm24{k5}{z}, [rbx+r11*8+256] vpmovzxdq zmm24{k5}{z}, [rbx+r11*8-256] vpmovzxwd xmm2, xmm0 vpmovzxwd xmm2, [rbx] vpmovzxwd xmm2, [rbx+r11*8+256] vpmovzxwd xmm2, [rbx+r11*8-256] vpmovzxwd xmm2{k5}, xmm0 vpmovzxwd xmm2{k5}, [rbx] vpmovzxwd xmm2{k5}, [rbx+r11*8+256] vpmovzxwd xmm2{k5}, [rbx+r11*8-256] vpmovzxwd xmm2{k5}{z}, xmm0 vpmovzxwd xmm2{k5}{z}, [rbx] vpmovzxwd xmm2{k5}{z}, [rbx+r11*8+256] vpmovzxwd xmm2{k5}{z}, [rbx+r11*8-256] vpmovzxwd ymm16, xmm0 vpmovzxwd ymm16, [rbx] vpmovzxwd ymm16, [rbx+r11*8+256] vpmovzxwd ymm16, [rbx+r11*8-256] vpmovzxwd ymm16{k5}, xmm0 vpmovzxwd ymm16{k5}, [rbx] vpmovzxwd ymm16{k5}, [rbx+r11*8+256] vpmovzxwd ymm16{k5}, [rbx+r11*8-256] vpmovzxwd ymm16{k5}{z}, xmm0 vpmovzxwd ymm16{k5}{z}, [rbx] vpmovzxwd ymm16{k5}{z}, [rbx+r11*8+256] vpmovzxwd ymm16{k5}{z}, [rbx+r11*8-256] vpmovzxwd zmm24, ymm15 vpmovzxwd zmm24, [rbx] vpmovzxwd zmm24, [rbx+r11*8+256] vpmovzxwd zmm24, [rbx+r11*8-256] vpmovzxwd zmm24{k5}, ymm15 vpmovzxwd zmm24{k5}, [rbx] vpmovzxwd zmm24{k5}, [rbx+r11*8+256] vpmovzxwd zmm24{k5}, [rbx+r11*8-256] vpmovzxwd zmm24{k5}{z}, ymm15 vpmovzxwd zmm24{k5}{z}, [rbx] vpmovzxwd zmm24{k5}{z}, [rbx+r11*8+256] vpmovzxwd zmm24{k5}{z}, [rbx+r11*8-256] vpmovzxwq xmm2, xmm0 vpmovzxwq xmm2, [rbx] vpmovzxwq xmm2, [rbx+r11*8+256] vpmovzxwq xmm2, [rbx+r11*8-256] vpmovzxwq xmm2{k5}, xmm0 vpmovzxwq xmm2{k5}, [rbx] vpmovzxwq xmm2{k5}, [rbx+r11*8+256] vpmovzxwq xmm2{k5}, [rbx+r11*8-256] vpmovzxwq xmm2{k5}{z}, xmm0 vpmovzxwq xmm2{k5}{z}, [rbx] vpmovzxwq xmm2{k5}{z}, [rbx+r11*8+256] vpmovzxwq xmm2{k5}{z}, [rbx+r11*8-256] vpmovzxwq ymm16, xmm0 vpmovzxwq ymm16, [rbx] vpmovzxwq ymm16, [rbx+r11*8+256] vpmovzxwq ymm16, [rbx+r11*8-256] vpmovzxwq ymm16{k5}, xmm0 vpmovzxwq ymm16{k5}, [rbx] vpmovzxwq ymm16{k5}, [rbx+r11*8+256] vpmovzxwq ymm16{k5}, [rbx+r11*8-256] vpmovzxwq ymm16{k5}{z}, xmm0 vpmovzxwq ymm16{k5}{z}, [rbx] vpmovzxwq ymm16{k5}{z}, [rbx+r11*8+256] vpmovzxwq ymm16{k5}{z}, [rbx+r11*8-256] vpmovzxwq zmm24, xmm0 vpmovzxwq zmm24, [rbx] vpmovzxwq zmm24, [rbx+r11*8+256] vpmovzxwq zmm24, [rbx+r11*8-256] vpmovzxwq zmm24{k5}, xmm0 vpmovzxwq zmm24{k5}, [rbx] vpmovzxwq zmm24{k5}, [rbx+r11*8+256] vpmovzxwq zmm24{k5}, [rbx+r11*8-256] vpmovzxwq zmm24{k5}{z}, xmm0 vpmovzxwq zmm24{k5}{z}, [rbx] vpmovzxwq zmm24{k5}{z}, [rbx+r11*8+256] vpmovzxwq zmm24{k5}{z}, [rbx+r11*8-256] vpmuldq xmm2, xmm7, xmm0 vpmuldq xmm2, xmm7, [rbx] vpmuldq xmm2, xmm7, [rbx]{1to2} vpmuldq xmm2, xmm7, [rbx+r11*8+256] vpmuldq xmm2, xmm7, [rbx+r11*8-256] vpmuldq xmm2{k5}, xmm7, xmm0 vpmuldq xmm2{k5}, xmm7, [rbx] vpmuldq xmm2{k5}, xmm7, [rbx]{1to2} vpmuldq xmm2{k5}, xmm7, [rbx+r11*8+256] vpmuldq xmm2{k5}, xmm7, [rbx+r11*8-256] vpmuldq xmm2{k5}{z}, xmm7, xmm0 vpmuldq xmm2{k5}{z}, xmm7, [rbx] vpmuldq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpmuldq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmuldq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmuldq ymm16, ymm13, ymm15 vpmuldq ymm16, ymm13, [rbx] vpmuldq ymm16, ymm13, [rbx]{1to4} vpmuldq ymm16, ymm13, [rbx+r11*8+256] vpmuldq ymm16, ymm13, [rbx+r11*8-256] vpmuldq ymm16{k5}, ymm13, ymm15 vpmuldq ymm16{k5}, ymm13, [rbx] vpmuldq ymm16{k5}, ymm13, [rbx]{1to4} vpmuldq ymm16{k5}, ymm13, [rbx+r11*8+256] vpmuldq ymm16{k5}, ymm13, [rbx+r11*8-256] vpmuldq ymm16{k5}{z}, ymm13, ymm15 vpmuldq ymm16{k5}{z}, ymm13, [rbx] vpmuldq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpmuldq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmuldq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmuldq zmm24, zmm24, zmm31 vpmuldq zmm24, zmm24, [rbx] vpmuldq zmm24, zmm24, [rbx]{1to8} vpmuldq zmm24, zmm24, [rbx+r11*8+256] vpmuldq zmm24, zmm24, [rbx+r11*8-256] vpmuldq zmm24{k5}, zmm24, zmm31 vpmuldq zmm24{k5}, zmm24, [rbx] vpmuldq zmm24{k5}, zmm24, [rbx]{1to8} vpmuldq zmm24{k5}, zmm24, [rbx+r11*8+256] vpmuldq zmm24{k5}, zmm24, [rbx+r11*8-256] vpmuldq zmm24{k5}{z}, zmm24, zmm31 vpmuldq zmm24{k5}{z}, zmm24, [rbx] vpmuldq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpmuldq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmuldq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmulld xmm2, xmm7, xmm0 vpmulld xmm2, xmm7, [rbx] vpmulld xmm2, xmm7, [rbx]{1to4} vpmulld xmm2, xmm7, [rbx+r11*8+256] vpmulld xmm2, xmm7, [rbx+r11*8-256] vpmulld xmm2{k5}, xmm7, xmm0 vpmulld xmm2{k5}, xmm7, [rbx] vpmulld xmm2{k5}, xmm7, [rbx]{1to4} vpmulld xmm2{k5}, xmm7, [rbx+r11*8+256] vpmulld xmm2{k5}, xmm7, [rbx+r11*8-256] vpmulld xmm2{k5}{z}, xmm7, xmm0 vpmulld xmm2{k5}{z}, xmm7, [rbx] vpmulld xmm2{k5}{z}, xmm7, [rbx]{1to4} vpmulld xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmulld xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmulld ymm16, ymm13, ymm15 vpmulld ymm16, ymm13, [rbx] vpmulld ymm16, ymm13, [rbx]{1to8} vpmulld ymm16, ymm13, [rbx+r11*8+256] vpmulld ymm16, ymm13, [rbx+r11*8-256] vpmulld ymm16{k5}, ymm13, ymm15 vpmulld ymm16{k5}, ymm13, [rbx] vpmulld ymm16{k5}, ymm13, [rbx]{1to8} vpmulld ymm16{k5}, ymm13, [rbx+r11*8+256] vpmulld ymm16{k5}, ymm13, [rbx+r11*8-256] vpmulld ymm16{k5}{z}, ymm13, ymm15 vpmulld ymm16{k5}{z}, ymm13, [rbx] vpmulld ymm16{k5}{z}, ymm13, [rbx]{1to8} vpmulld ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmulld ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmulld zmm24, zmm24, zmm31 vpmulld zmm24, zmm24, [rbx] vpmulld zmm24, zmm24, [rbx]{1to16} vpmulld zmm24, zmm24, [rbx+r11*8+256] vpmulld zmm24, zmm24, [rbx+r11*8-256] vpmulld zmm24{k5}, zmm24, zmm31 vpmulld zmm24{k5}, zmm24, [rbx] vpmulld zmm24{k5}, zmm24, [rbx]{1to16} vpmulld zmm24{k5}, zmm24, [rbx+r11*8+256] vpmulld zmm24{k5}, zmm24, [rbx+r11*8-256] vpmulld zmm24{k5}{z}, zmm24, zmm31 vpmulld zmm24{k5}{z}, zmm24, [rbx] vpmulld zmm24{k5}{z}, zmm24, [rbx]{1to16} vpmulld zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmulld zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpmuludq xmm2, xmm7, xmm0 vpmuludq xmm2, xmm7, [rbx] vpmuludq xmm2, xmm7, [rbx]{1to2} vpmuludq xmm2, xmm7, [rbx+r11*8+256] vpmuludq xmm2, xmm7, [rbx+r11*8-256] vpmuludq xmm2{k5}, xmm7, xmm0 vpmuludq xmm2{k5}, xmm7, [rbx] vpmuludq xmm2{k5}, xmm7, [rbx]{1to2} vpmuludq xmm2{k5}, xmm7, [rbx+r11*8+256] vpmuludq xmm2{k5}, xmm7, [rbx+r11*8-256] vpmuludq xmm2{k5}{z}, xmm7, xmm0 vpmuludq xmm2{k5}{z}, xmm7, [rbx] vpmuludq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpmuludq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpmuludq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpmuludq ymm16, ymm13, ymm15 vpmuludq ymm16, ymm13, [rbx] vpmuludq ymm16, ymm13, [rbx]{1to4} vpmuludq ymm16, ymm13, [rbx+r11*8+256] vpmuludq ymm16, ymm13, [rbx+r11*8-256] vpmuludq ymm16{k5}, ymm13, ymm15 vpmuludq ymm16{k5}, ymm13, [rbx] vpmuludq ymm16{k5}, ymm13, [rbx]{1to4} vpmuludq ymm16{k5}, ymm13, [rbx+r11*8+256] vpmuludq ymm16{k5}, ymm13, [rbx+r11*8-256] vpmuludq ymm16{k5}{z}, ymm13, ymm15 vpmuludq ymm16{k5}{z}, ymm13, [rbx] vpmuludq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpmuludq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpmuludq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpmuludq zmm24, zmm24, zmm31 vpmuludq zmm24, zmm24, [rbx] vpmuludq zmm24, zmm24, [rbx]{1to8} vpmuludq zmm24, zmm24, [rbx+r11*8+256] vpmuludq zmm24, zmm24, [rbx+r11*8-256] vpmuludq zmm24{k5}, zmm24, zmm31 vpmuludq zmm24{k5}, zmm24, [rbx] vpmuludq zmm24{k5}, zmm24, [rbx]{1to8} vpmuludq zmm24{k5}, zmm24, [rbx+r11*8+256] vpmuludq zmm24{k5}, zmm24, [rbx+r11*8-256] vpmuludq zmm24{k5}{z}, zmm24, zmm31 vpmuludq zmm24{k5}{z}, zmm24, [rbx] vpmuludq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpmuludq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpmuludq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpord xmm2, xmm7, xmm0 vpord xmm2, xmm7, [rbx] vpord xmm2, xmm7, [rbx]{1to4} vpord xmm2, xmm7, [rbx+r11*8+256] vpord xmm2, xmm7, [rbx+r11*8-256] vpord xmm2{k5}, xmm7, xmm0 vpord xmm2{k5}, xmm7, [rbx] vpord xmm2{k5}, xmm7, [rbx]{1to4} vpord xmm2{k5}, xmm7, [rbx+r11*8+256] vpord xmm2{k5}, xmm7, [rbx+r11*8-256] vpord xmm2{k5}{z}, xmm7, xmm0 vpord xmm2{k5}{z}, xmm7, [rbx] vpord xmm2{k5}{z}, xmm7, [rbx]{1to4} vpord xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpord xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpord ymm16, ymm13, ymm15 vpord ymm16, ymm13, [rbx] vpord ymm16, ymm13, [rbx]{1to8} vpord ymm16, ymm13, [rbx+r11*8+256] vpord ymm16, ymm13, [rbx+r11*8-256] vpord ymm16{k5}, ymm13, ymm15 vpord ymm16{k5}, ymm13, [rbx] vpord ymm16{k5}, ymm13, [rbx]{1to8} vpord ymm16{k5}, ymm13, [rbx+r11*8+256] vpord ymm16{k5}, ymm13, [rbx+r11*8-256] vpord ymm16{k5}{z}, ymm13, ymm15 vpord ymm16{k5}{z}, ymm13, [rbx] vpord ymm16{k5}{z}, ymm13, [rbx]{1to8} vpord ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpord ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpord zmm24, zmm24, zmm31 vpord zmm24, zmm24, [rbx] vpord zmm24, zmm24, [rbx]{1to16} vpord zmm24, zmm24, [rbx+r11*8+256] vpord zmm24, zmm24, [rbx+r11*8-256] vpord zmm24{k5}, zmm24, zmm31 vpord zmm24{k5}, zmm24, [rbx] vpord zmm24{k5}, zmm24, [rbx]{1to16} vpord zmm24{k5}, zmm24, [rbx+r11*8+256] vpord zmm24{k5}, zmm24, [rbx+r11*8-256] vpord zmm24{k5}{z}, zmm24, zmm31 vpord zmm24{k5}{z}, zmm24, [rbx] vpord zmm24{k5}{z}, zmm24, [rbx]{1to16} vpord zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpord zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vporq xmm2, xmm7, xmm0 vporq xmm2, xmm7, [rbx] vporq xmm2, xmm7, [rbx]{1to2} vporq xmm2, xmm7, [rbx+r11*8+256] vporq xmm2, xmm7, [rbx+r11*8-256] vporq xmm2{k5}, xmm7, xmm0 vporq xmm2{k5}, xmm7, [rbx] vporq xmm2{k5}, xmm7, [rbx]{1to2} vporq xmm2{k5}, xmm7, [rbx+r11*8+256] vporq xmm2{k5}, xmm7, [rbx+r11*8-256] vporq xmm2{k5}{z}, xmm7, xmm0 vporq xmm2{k5}{z}, xmm7, [rbx] vporq xmm2{k5}{z}, xmm7, [rbx]{1to2} vporq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vporq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vporq ymm16, ymm13, ymm15 vporq ymm16, ymm13, [rbx] vporq ymm16, ymm13, [rbx]{1to4} vporq ymm16, ymm13, [rbx+r11*8+256] vporq ymm16, ymm13, [rbx+r11*8-256] vporq ymm16{k5}, ymm13, ymm15 vporq ymm16{k5}, ymm13, [rbx] vporq ymm16{k5}, ymm13, [rbx]{1to4} vporq ymm16{k5}, ymm13, [rbx+r11*8+256] vporq ymm16{k5}, ymm13, [rbx+r11*8-256] vporq ymm16{k5}{z}, ymm13, ymm15 vporq ymm16{k5}{z}, ymm13, [rbx] vporq ymm16{k5}{z}, ymm13, [rbx]{1to4} vporq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vporq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vporq zmm24, zmm24, zmm31 vporq zmm24, zmm24, [rbx] vporq zmm24, zmm24, [rbx]{1to8} vporq zmm24, zmm24, [rbx+r11*8+256] vporq zmm24, zmm24, [rbx+r11*8-256] vporq zmm24{k5}, zmm24, zmm31 vporq zmm24{k5}, zmm24, [rbx] vporq zmm24{k5}, zmm24, [rbx]{1to8} vporq zmm24{k5}, zmm24, [rbx+r11*8+256] vporq zmm24{k5}, zmm24, [rbx+r11*8-256] vporq zmm24{k5}{z}, zmm24, zmm31 vporq zmm24{k5}{z}, zmm24, [rbx] vporq zmm24{k5}{z}, zmm24, [rbx]{1to8} vporq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vporq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vprold xmm7, xmm0, 10 vprold xmm7, [rbx], 10 vprold xmm7, [rbx]{1to4}, 10 vprold xmm7, [rbx+r11*8+256], 10 vprold xmm7, [rbx+r11*8-256], 10 vprold ymm13, ymm15, 10 vprold ymm13, [rbx], 10 vprold ymm13, [rbx]{1to8}, 10 vprold ymm13, [rbx+r11*8+256], 10 vprold ymm13, [rbx+r11*8-256], 10 vprold zmm24, zmm31, 10 vprold zmm24, [rbx], 10 vprold zmm24, [rbx]{1to16}, 10 vprold zmm24, [rbx+r11*8+256], 10 vprold zmm24, [rbx+r11*8-256], 10 vprolq xmm7, xmm0, 10 vprolq xmm7, [rbx], 10 vprolq xmm7, [rbx]{1to2}, 10 vprolq xmm7, [rbx+r11*8+256], 10 vprolq xmm7, [rbx+r11*8-256], 10 vprolq ymm13, ymm15, 10 vprolq ymm13, [rbx], 10 vprolq ymm13, [rbx]{1to4}, 10 vprolq ymm13, [rbx+r11*8+256], 10 vprolq ymm13, [rbx+r11*8-256], 10 vprolq zmm24, zmm31, 10 vprolq zmm24, [rbx], 10 vprolq zmm24, [rbx]{1to8}, 10 vprolq zmm24, [rbx+r11*8+256], 10 vprolq zmm24, [rbx+r11*8-256], 10 vprolvd xmm2, xmm7, xmm0 vprolvd xmm2, xmm7, [rbx] vprolvd xmm2, xmm7, [rbx]{1to4} vprolvd xmm2, xmm7, [rbx+r11*8+256] vprolvd xmm2, xmm7, [rbx+r11*8-256] vprolvd xmm2{k5}, xmm7, xmm0 vprolvd xmm2{k5}, xmm7, [rbx] vprolvd xmm2{k5}, xmm7, [rbx]{1to4} vprolvd xmm2{k5}, xmm7, [rbx+r11*8+256] vprolvd xmm2{k5}, xmm7, [rbx+r11*8-256] vprolvd xmm2{k5}{z}, xmm7, xmm0 vprolvd xmm2{k5}{z}, xmm7, [rbx] vprolvd xmm2{k5}{z}, xmm7, [rbx]{1to4} vprolvd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vprolvd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vprolvd ymm16, ymm13, ymm15 vprolvd ymm16, ymm13, [rbx] vprolvd ymm16, ymm13, [rbx]{1to8} vprolvd ymm16, ymm13, [rbx+r11*8+256] vprolvd ymm16, ymm13, [rbx+r11*8-256] vprolvd ymm16{k5}, ymm13, ymm15 vprolvd ymm16{k5}, ymm13, [rbx] vprolvd ymm16{k5}, ymm13, [rbx]{1to8} vprolvd ymm16{k5}, ymm13, [rbx+r11*8+256] vprolvd ymm16{k5}, ymm13, [rbx+r11*8-256] vprolvd ymm16{k5}{z}, ymm13, ymm15 vprolvd ymm16{k5}{z}, ymm13, [rbx] vprolvd ymm16{k5}{z}, ymm13, [rbx]{1to8} vprolvd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vprolvd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vprolvd zmm24, zmm24, zmm31 vprolvd zmm24, zmm24, [rbx] vprolvd zmm24, zmm24, [rbx]{1to16} vprolvd zmm24, zmm24, [rbx+r11*8+256] vprolvd zmm24, zmm24, [rbx+r11*8-256] vprolvd zmm24{k5}, zmm24, zmm31 vprolvd zmm24{k5}, zmm24, [rbx] vprolvd zmm24{k5}, zmm24, [rbx]{1to16} vprolvd zmm24{k5}, zmm24, [rbx+r11*8+256] vprolvd zmm24{k5}, zmm24, [rbx+r11*8-256] vprolvd zmm24{k5}{z}, zmm24, zmm31 vprolvd zmm24{k5}{z}, zmm24, [rbx] vprolvd zmm24{k5}{z}, zmm24, [rbx]{1to16} vprolvd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vprolvd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vprolvq xmm2, xmm7, xmm0 vprolvq xmm2, xmm7, [rbx] vprolvq xmm2, xmm7, [rbx]{1to2} vprolvq xmm2, xmm7, [rbx+r11*8+256] vprolvq xmm2, xmm7, [rbx+r11*8-256] vprolvq xmm2{k5}, xmm7, xmm0 vprolvq xmm2{k5}, xmm7, [rbx] vprolvq xmm2{k5}, xmm7, [rbx]{1to2} vprolvq xmm2{k5}, xmm7, [rbx+r11*8+256] vprolvq xmm2{k5}, xmm7, [rbx+r11*8-256] vprolvq xmm2{k5}{z}, xmm7, xmm0 vprolvq xmm2{k5}{z}, xmm7, [rbx] vprolvq xmm2{k5}{z}, xmm7, [rbx]{1to2} vprolvq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vprolvq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vprolvq ymm16, ymm13, ymm15 vprolvq ymm16, ymm13, [rbx] vprolvq ymm16, ymm13, [rbx]{1to4} vprolvq ymm16, ymm13, [rbx+r11*8+256] vprolvq ymm16, ymm13, [rbx+r11*8-256] vprolvq ymm16{k5}, ymm13, ymm15 vprolvq ymm16{k5}, ymm13, [rbx] vprolvq ymm16{k5}, ymm13, [rbx]{1to4} vprolvq ymm16{k5}, ymm13, [rbx+r11*8+256] vprolvq ymm16{k5}, ymm13, [rbx+r11*8-256] vprolvq ymm16{k5}{z}, ymm13, ymm15 vprolvq ymm16{k5}{z}, ymm13, [rbx] vprolvq ymm16{k5}{z}, ymm13, [rbx]{1to4} vprolvq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vprolvq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vprolvq zmm24, zmm24, zmm31 vprolvq zmm24, zmm24, [rbx] vprolvq zmm24, zmm24, [rbx]{1to8} vprolvq zmm24, zmm24, [rbx+r11*8+256] vprolvq zmm24, zmm24, [rbx+r11*8-256] vprolvq zmm24{k5}, zmm24, zmm31 vprolvq zmm24{k5}, zmm24, [rbx] vprolvq zmm24{k5}, zmm24, [rbx]{1to8} vprolvq zmm24{k5}, zmm24, [rbx+r11*8+256] vprolvq zmm24{k5}, zmm24, [rbx+r11*8-256] vprolvq zmm24{k5}{z}, zmm24, zmm31 vprolvq zmm24{k5}{z}, zmm24, [rbx] vprolvq zmm24{k5}{z}, zmm24, [rbx]{1to8} vprolvq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vprolvq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vprord xmm7, xmm0, 10 vprord xmm7, [rbx], 10 vprord xmm7, [rbx]{1to4}, 10 vprord xmm7, [rbx+r11*8+256], 10 vprord xmm7, [rbx+r11*8-256], 10 vprord ymm13, ymm15, 10 vprord ymm13, [rbx], 10 vprord ymm13, [rbx]{1to8}, 10 vprord ymm13, [rbx+r11*8+256], 10 vprord ymm13, [rbx+r11*8-256], 10 vprord zmm24, zmm31, 10 vprord zmm24, [rbx], 10 vprord zmm24, [rbx]{1to16}, 10 vprord zmm24, [rbx+r11*8+256], 10 vprord zmm24, [rbx+r11*8-256], 10 vprorq xmm7, xmm0, 10 vprorq xmm7, [rbx], 10 vprorq xmm7, [rbx]{1to2}, 10 vprorq xmm7, [rbx+r11*8+256], 10 vprorq xmm7, [rbx+r11*8-256], 10 vprorq ymm13, ymm15, 10 vprorq ymm13, [rbx], 10 vprorq ymm13, [rbx]{1to4}, 10 vprorq ymm13, [rbx+r11*8+256], 10 vprorq ymm13, [rbx+r11*8-256], 10 vprorq zmm24, zmm31, 10 vprorq zmm24, [rbx], 10 vprorq zmm24, [rbx]{1to8}, 10 vprorq zmm24, [rbx+r11*8+256], 10 vprorq zmm24, [rbx+r11*8-256], 10 vprorvd xmm2, xmm7, xmm0 vprorvd xmm2, xmm7, [rbx] vprorvd xmm2, xmm7, [rbx]{1to4} vprorvd xmm2, xmm7, [rbx+r11*8+256] vprorvd xmm2, xmm7, [rbx+r11*8-256] vprorvd xmm2{k5}, xmm7, xmm0 vprorvd xmm2{k5}, xmm7, [rbx] vprorvd xmm2{k5}, xmm7, [rbx]{1to4} vprorvd xmm2{k5}, xmm7, [rbx+r11*8+256] vprorvd xmm2{k5}, xmm7, [rbx+r11*8-256] vprorvd xmm2{k5}{z}, xmm7, xmm0 vprorvd xmm2{k5}{z}, xmm7, [rbx] vprorvd xmm2{k5}{z}, xmm7, [rbx]{1to4} vprorvd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vprorvd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vprorvd ymm16, ymm13, ymm15 vprorvd ymm16, ymm13, [rbx] vprorvd ymm16, ymm13, [rbx]{1to8} vprorvd ymm16, ymm13, [rbx+r11*8+256] vprorvd ymm16, ymm13, [rbx+r11*8-256] vprorvd ymm16{k5}, ymm13, ymm15 vprorvd ymm16{k5}, ymm13, [rbx] vprorvd ymm16{k5}, ymm13, [rbx]{1to8} vprorvd ymm16{k5}, ymm13, [rbx+r11*8+256] vprorvd ymm16{k5}, ymm13, [rbx+r11*8-256] vprorvd ymm16{k5}{z}, ymm13, ymm15 vprorvd ymm16{k5}{z}, ymm13, [rbx] vprorvd ymm16{k5}{z}, ymm13, [rbx]{1to8} vprorvd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vprorvd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vprorvd zmm24, zmm24, zmm31 vprorvd zmm24, zmm24, [rbx] vprorvd zmm24, zmm24, [rbx]{1to16} vprorvd zmm24, zmm24, [rbx+r11*8+256] vprorvd zmm24, zmm24, [rbx+r11*8-256] vprorvd zmm24{k5}, zmm24, zmm31 vprorvd zmm24{k5}, zmm24, [rbx] vprorvd zmm24{k5}, zmm24, [rbx]{1to16} vprorvd zmm24{k5}, zmm24, [rbx+r11*8+256] vprorvd zmm24{k5}, zmm24, [rbx+r11*8-256] vprorvd zmm24{k5}{z}, zmm24, zmm31 vprorvd zmm24{k5}{z}, zmm24, [rbx] vprorvd zmm24{k5}{z}, zmm24, [rbx]{1to16} vprorvd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vprorvd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vprorvq xmm2, xmm7, xmm0 vprorvq xmm2, xmm7, [rbx] vprorvq xmm2, xmm7, [rbx]{1to2} vprorvq xmm2, xmm7, [rbx+r11*8+256] vprorvq xmm2, xmm7, [rbx+r11*8-256] vprorvq xmm2{k5}, xmm7, xmm0 vprorvq xmm2{k5}, xmm7, [rbx] vprorvq xmm2{k5}, xmm7, [rbx]{1to2} vprorvq xmm2{k5}, xmm7, [rbx+r11*8+256] vprorvq xmm2{k5}, xmm7, [rbx+r11*8-256] vprorvq xmm2{k5}{z}, xmm7, xmm0 vprorvq xmm2{k5}{z}, xmm7, [rbx] vprorvq xmm2{k5}{z}, xmm7, [rbx]{1to2} vprorvq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vprorvq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vprorvq ymm16, ymm13, ymm15 vprorvq ymm16, ymm13, [rbx] vprorvq ymm16, ymm13, [rbx]{1to4} vprorvq ymm16, ymm13, [rbx+r11*8+256] vprorvq ymm16, ymm13, [rbx+r11*8-256] vprorvq ymm16{k5}, ymm13, ymm15 vprorvq ymm16{k5}, ymm13, [rbx] vprorvq ymm16{k5}, ymm13, [rbx]{1to4} vprorvq ymm16{k5}, ymm13, [rbx+r11*8+256] vprorvq ymm16{k5}, ymm13, [rbx+r11*8-256] vprorvq ymm16{k5}{z}, ymm13, ymm15 vprorvq ymm16{k5}{z}, ymm13, [rbx] vprorvq ymm16{k5}{z}, ymm13, [rbx]{1to4} vprorvq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vprorvq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vprorvq zmm24, zmm24, zmm31 vprorvq zmm24, zmm24, [rbx] vprorvq zmm24, zmm24, [rbx]{1to8} vprorvq zmm24, zmm24, [rbx+r11*8+256] vprorvq zmm24, zmm24, [rbx+r11*8-256] vprorvq zmm24{k5}, zmm24, zmm31 vprorvq zmm24{k5}, zmm24, [rbx] vprorvq zmm24{k5}, zmm24, [rbx]{1to8} vprorvq zmm24{k5}, zmm24, [rbx+r11*8+256] vprorvq zmm24{k5}, zmm24, [rbx+r11*8-256] vprorvq zmm24{k5}{z}, zmm24, zmm31 vprorvq zmm24{k5}{z}, zmm24, [rbx] vprorvq zmm24{k5}{z}, zmm24, [rbx]{1to8} vprorvq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vprorvq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpshufd xmm2, xmm0, 10 vpshufd xmm2, [rbx], 10 vpshufd xmm2, [rbx]{1to4}, 10 vpshufd xmm2, [rbx+r11*8+256], 10 vpshufd xmm2, [rbx+r11*8-256], 10 vpshufd xmm2{k5}, xmm0, 10 vpshufd xmm2{k5}, [rbx], 10 vpshufd xmm2{k5}, [rbx]{1to4}, 10 vpshufd xmm2{k5}, [rbx+r11*8+256], 10 vpshufd xmm2{k5}, [rbx+r11*8-256], 10 vpshufd xmm2{k5}{z}, xmm0, 10 vpshufd xmm2{k5}{z}, [rbx], 10 vpshufd xmm2{k5}{z}, [rbx]{1to4}, 10 vpshufd xmm2{k5}{z}, [rbx+r11*8+256], 10 vpshufd xmm2{k5}{z}, [rbx+r11*8-256], 10 vpshufd ymm16, ymm15, 10 vpshufd ymm16, [rbx], 10 vpshufd ymm16, [rbx]{1to8}, 10 vpshufd ymm16, [rbx+r11*8+256], 10 vpshufd ymm16, [rbx+r11*8-256], 10 vpshufd ymm16{k5}, ymm15, 10 vpshufd ymm16{k5}, [rbx], 10 vpshufd ymm16{k5}, [rbx]{1to8}, 10 vpshufd ymm16{k5}, [rbx+r11*8+256], 10 vpshufd ymm16{k5}, [rbx+r11*8-256], 10 vpshufd ymm16{k5}{z}, ymm15, 10 vpshufd ymm16{k5}{z}, [rbx], 10 vpshufd ymm16{k5}{z}, [rbx]{1to8}, 10 vpshufd ymm16{k5}{z}, [rbx+r11*8+256], 10 vpshufd ymm16{k5}{z}, [rbx+r11*8-256], 10 vpshufd zmm24, zmm31, 10 vpshufd zmm24, [rbx], 10 vpshufd zmm24, [rbx]{1to16}, 10 vpshufd zmm24, [rbx+r11*8+256], 10 vpshufd zmm24, [rbx+r11*8-256], 10 vpshufd zmm24{k5}, zmm31, 10 vpshufd zmm24{k5}, [rbx], 10 vpshufd zmm24{k5}, [rbx]{1to16}, 10 vpshufd zmm24{k5}, [rbx+r11*8+256], 10 vpshufd zmm24{k5}, [rbx+r11*8-256], 10 vpshufd zmm24{k5}{z}, zmm31, 10 vpshufd zmm24{k5}{z}, [rbx], 10 vpshufd zmm24{k5}{z}, [rbx]{1to16}, 10 vpshufd zmm24{k5}{z}, [rbx+r11*8+256], 10 vpshufd zmm24{k5}{z}, [rbx+r11*8-256], 10 vpslld xmm7, xmm0, 10 vpslld xmm7, [rbx], 10 vpslld xmm7, [rbx]{1to4}, 10 vpslld xmm7, [rbx+r11*8+256], 10 vpslld xmm7, [rbx+r11*8-256], 10 vpslld ymm13, ymm15, 10 vpslld ymm13, [rbx], 10 vpslld ymm13, [rbx]{1to8}, 10 vpslld ymm13, [rbx+r11*8+256], 10 vpslld ymm13, [rbx+r11*8-256], 10 vpslld zmm24, zmm31, 10 vpslld zmm24, [rbx], 10 vpslld zmm24, [rbx]{1to16}, 10 vpslld zmm24, [rbx+r11*8+256], 10 vpslld zmm24, [rbx+r11*8-256], 10 vpslld xmm2, xmm7, xmm0 vpslld xmm2, xmm7, [rbx] vpslld xmm2, xmm7, [rbx+r11*8+256] vpslld xmm2, xmm7, [rbx+r11*8-256] vpslld xmm2{k5}, xmm7, xmm0 vpslld xmm2{k5}, xmm7, [rbx] vpslld xmm2{k5}, xmm7, [rbx+r11*8+256] vpslld xmm2{k5}, xmm7, [rbx+r11*8-256] vpslld xmm2{k5}{z}, xmm7, xmm0 vpslld xmm2{k5}{z}, xmm7, [rbx] vpslld xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpslld xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpslld ymm16, ymm13, xmm0 vpslld ymm16, ymm13, [rbx] vpslld ymm16, ymm13, [rbx+r11*8+256] vpslld ymm16, ymm13, [rbx+r11*8-256] vpslld ymm16{k5}, ymm13, xmm0 vpslld ymm16{k5}, ymm13, [rbx] vpslld ymm16{k5}, ymm13, [rbx+r11*8+256] vpslld ymm16{k5}, ymm13, [rbx+r11*8-256] vpslld ymm16{k5}{z}, ymm13, xmm0 vpslld ymm16{k5}{z}, ymm13, [rbx] vpslld ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpslld ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpslld zmm24, zmm24, xmm0 vpslld zmm24, zmm24, [rbx] vpslld zmm24, zmm24, [rbx+r11*8+256] vpslld zmm24, zmm24, [rbx+r11*8-256] vpslld zmm24{k5}, zmm24, xmm0 vpslld zmm24{k5}, zmm24, [rbx] vpslld zmm24{k5}, zmm24, [rbx+r11*8+256] vpslld zmm24{k5}, zmm24, [rbx+r11*8-256] vpslld zmm24{k5}{z}, zmm24, xmm0 vpslld zmm24{k5}{z}, zmm24, [rbx] vpslld zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpslld zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsllq xmm7, xmm0, 10 vpsllq xmm7, [rbx], 10 vpsllq xmm7, [rbx]{1to2}, 10 vpsllq xmm7, [rbx+r11*8+256], 10 vpsllq xmm7, [rbx+r11*8-256], 10 vpsllq ymm13, ymm15, 10 vpsllq ymm13, [rbx], 10 vpsllq ymm13, [rbx]{1to4}, 10 vpsllq ymm13, [rbx+r11*8+256], 10 vpsllq ymm13, [rbx+r11*8-256], 10 vpsllq zmm24, zmm31, 10 vpsllq zmm24, [rbx], 10 vpsllq zmm24, [rbx]{1to8}, 10 vpsllq zmm24, [rbx+r11*8+256], 10 vpsllq zmm24, [rbx+r11*8-256], 10 vpsllq xmm2, xmm7, xmm0 vpsllq xmm2, xmm7, [rbx] vpsllq xmm2, xmm7, [rbx+r11*8+256] vpsllq xmm2, xmm7, [rbx+r11*8-256] vpsllq xmm2{k5}, xmm7, xmm0 vpsllq xmm2{k5}, xmm7, [rbx] vpsllq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsllq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsllq xmm2{k5}{z}, xmm7, xmm0 vpsllq xmm2{k5}{z}, xmm7, [rbx] vpsllq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsllq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsllq ymm16, ymm13, xmm0 vpsllq ymm16, ymm13, [rbx] vpsllq ymm16, ymm13, [rbx+r11*8+256] vpsllq ymm16, ymm13, [rbx+r11*8-256] vpsllq ymm16{k5}, ymm13, xmm0 vpsllq ymm16{k5}, ymm13, [rbx] vpsllq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsllq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsllq ymm16{k5}{z}, ymm13, xmm0 vpsllq ymm16{k5}{z}, ymm13, [rbx] vpsllq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsllq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsllq zmm24, zmm24, xmm0 vpsllq zmm24, zmm24, [rbx] vpsllq zmm24, zmm24, [rbx+r11*8+256] vpsllq zmm24, zmm24, [rbx+r11*8-256] vpsllq zmm24{k5}, zmm24, xmm0 vpsllq zmm24{k5}, zmm24, [rbx] vpsllq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsllq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsllq zmm24{k5}{z}, zmm24, xmm0 vpsllq zmm24{k5}{z}, zmm24, [rbx] vpsllq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsllq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsllvd xmm2, xmm7, xmm0 vpsllvd xmm2, xmm7, [rbx] vpsllvd xmm2, xmm7, [rbx]{1to4} vpsllvd xmm2, xmm7, [rbx+r11*8+256] vpsllvd xmm2, xmm7, [rbx+r11*8-256] vpsllvd xmm2{k5}, xmm7, xmm0 vpsllvd xmm2{k5}, xmm7, [rbx] vpsllvd xmm2{k5}, xmm7, [rbx]{1to4} vpsllvd xmm2{k5}, xmm7, [rbx+r11*8+256] vpsllvd xmm2{k5}, xmm7, [rbx+r11*8-256] vpsllvd xmm2{k5}{z}, xmm7, xmm0 vpsllvd xmm2{k5}{z}, xmm7, [rbx] vpsllvd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpsllvd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsllvd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsllvd ymm16, ymm13, ymm15 vpsllvd ymm16, ymm13, [rbx] vpsllvd ymm16, ymm13, [rbx]{1to8} vpsllvd ymm16, ymm13, [rbx+r11*8+256] vpsllvd ymm16, ymm13, [rbx+r11*8-256] vpsllvd ymm16{k5}, ymm13, ymm15 vpsllvd ymm16{k5}, ymm13, [rbx] vpsllvd ymm16{k5}, ymm13, [rbx]{1to8} vpsllvd ymm16{k5}, ymm13, [rbx+r11*8+256] vpsllvd ymm16{k5}, ymm13, [rbx+r11*8-256] vpsllvd ymm16{k5}{z}, ymm13, ymm15 vpsllvd ymm16{k5}{z}, ymm13, [rbx] vpsllvd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpsllvd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsllvd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsllvd zmm24, zmm24, zmm31 vpsllvd zmm24, zmm24, [rbx] vpsllvd zmm24, zmm24, [rbx]{1to16} vpsllvd zmm24, zmm24, [rbx+r11*8+256] vpsllvd zmm24, zmm24, [rbx+r11*8-256] vpsllvd zmm24{k5}, zmm24, zmm31 vpsllvd zmm24{k5}, zmm24, [rbx] vpsllvd zmm24{k5}, zmm24, [rbx]{1to16} vpsllvd zmm24{k5}, zmm24, [rbx+r11*8+256] vpsllvd zmm24{k5}, zmm24, [rbx+r11*8-256] vpsllvd zmm24{k5}{z}, zmm24, zmm31 vpsllvd zmm24{k5}{z}, zmm24, [rbx] vpsllvd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpsllvd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsllvd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsllvq xmm2, xmm7, xmm0 vpsllvq xmm2, xmm7, [rbx] vpsllvq xmm2, xmm7, [rbx]{1to2} vpsllvq xmm2, xmm7, [rbx+r11*8+256] vpsllvq xmm2, xmm7, [rbx+r11*8-256] vpsllvq xmm2{k5}, xmm7, xmm0 vpsllvq xmm2{k5}, xmm7, [rbx] vpsllvq xmm2{k5}, xmm7, [rbx]{1to2} vpsllvq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsllvq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsllvq xmm2{k5}{z}, xmm7, xmm0 vpsllvq xmm2{k5}{z}, xmm7, [rbx] vpsllvq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpsllvq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsllvq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsllvq ymm16, ymm13, ymm15 vpsllvq ymm16, ymm13, [rbx] vpsllvq ymm16, ymm13, [rbx]{1to4} vpsllvq ymm16, ymm13, [rbx+r11*8+256] vpsllvq ymm16, ymm13, [rbx+r11*8-256] vpsllvq ymm16{k5}, ymm13, ymm15 vpsllvq ymm16{k5}, ymm13, [rbx] vpsllvq ymm16{k5}, ymm13, [rbx]{1to4} vpsllvq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsllvq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsllvq ymm16{k5}{z}, ymm13, ymm15 vpsllvq ymm16{k5}{z}, ymm13, [rbx] vpsllvq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpsllvq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsllvq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsllvq zmm24, zmm24, zmm31 vpsllvq zmm24, zmm24, [rbx] vpsllvq zmm24, zmm24, [rbx]{1to8} vpsllvq zmm24, zmm24, [rbx+r11*8+256] vpsllvq zmm24, zmm24, [rbx+r11*8-256] vpsllvq zmm24{k5}, zmm24, zmm31 vpsllvq zmm24{k5}, zmm24, [rbx] vpsllvq zmm24{k5}, zmm24, [rbx]{1to8} vpsllvq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsllvq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsllvq zmm24{k5}{z}, zmm24, zmm31 vpsllvq zmm24{k5}{z}, zmm24, [rbx] vpsllvq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpsllvq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsllvq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsrad xmm7, xmm0, 10 vpsrad xmm7, [rbx], 10 vpsrad xmm7, [rbx]{1to4}, 10 vpsrad xmm7, [rbx+r11*8+256], 10 vpsrad xmm7, [rbx+r11*8-256], 10 vpsrad ymm13, ymm15, 10 vpsrad ymm13, [rbx], 10 vpsrad ymm13, [rbx]{1to8}, 10 vpsrad ymm13, [rbx+r11*8+256], 10 vpsrad ymm13, [rbx+r11*8-256], 10 vpsrad zmm24, zmm31, 10 vpsrad zmm24, [rbx], 10 vpsrad zmm24, [rbx]{1to16}, 10 vpsrad zmm24, [rbx+r11*8+256], 10 vpsrad zmm24, [rbx+r11*8-256], 10 vpsrad xmm2, xmm7, xmm0 vpsrad xmm2, xmm7, [rbx] vpsrad xmm2, xmm7, [rbx+r11*8+256] vpsrad xmm2, xmm7, [rbx+r11*8-256] vpsrad xmm2{k5}, xmm7, xmm0 vpsrad xmm2{k5}, xmm7, [rbx] vpsrad xmm2{k5}, xmm7, [rbx+r11*8+256] vpsrad xmm2{k5}, xmm7, [rbx+r11*8-256] vpsrad xmm2{k5}{z}, xmm7, xmm0 vpsrad xmm2{k5}{z}, xmm7, [rbx] vpsrad xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsrad xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsrad ymm16, ymm13, xmm0 vpsrad ymm16, ymm13, [rbx] vpsrad ymm16, ymm13, [rbx+r11*8+256] vpsrad ymm16, ymm13, [rbx+r11*8-256] vpsrad ymm16{k5}, ymm13, xmm0 vpsrad ymm16{k5}, ymm13, [rbx] vpsrad ymm16{k5}, ymm13, [rbx+r11*8+256] vpsrad ymm16{k5}, ymm13, [rbx+r11*8-256] vpsrad ymm16{k5}{z}, ymm13, xmm0 vpsrad ymm16{k5}{z}, ymm13, [rbx] vpsrad ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsrad ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsrad zmm24, zmm24, xmm0 vpsrad zmm24, zmm24, [rbx] vpsrad zmm24, zmm24, [rbx+r11*8+256] vpsrad zmm24, zmm24, [rbx+r11*8-256] vpsrad zmm24{k5}, zmm24, xmm0 vpsrad zmm24{k5}, zmm24, [rbx] vpsrad zmm24{k5}, zmm24, [rbx+r11*8+256] vpsrad zmm24{k5}, zmm24, [rbx+r11*8-256] vpsrad zmm24{k5}{z}, zmm24, xmm0 vpsrad zmm24{k5}{z}, zmm24, [rbx] vpsrad zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsrad zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsraq xmm7, xmm0, 10 vpsraq xmm7, [rbx], 10 vpsraq xmm7, [rbx]{1to2}, 10 vpsraq xmm7, [rbx+r11*8+256], 10 vpsraq xmm7, [rbx+r11*8-256], 10 vpsraq ymm13, ymm15, 10 vpsraq ymm13, [rbx], 10 vpsraq ymm13, [rbx]{1to4}, 10 vpsraq ymm13, [rbx+r11*8+256], 10 vpsraq ymm13, [rbx+r11*8-256], 10 vpsraq zmm24, zmm31, 10 vpsraq zmm24, [rbx], 10 vpsraq zmm24, [rbx]{1to8}, 10 vpsraq zmm24, [rbx+r11*8+256], 10 vpsraq zmm24, [rbx+r11*8-256], 10 vpsraq xmm2, xmm7, xmm0 vpsraq xmm2, xmm7, [rbx] vpsraq xmm2, xmm7, [rbx+r11*8+256] vpsraq xmm2, xmm7, [rbx+r11*8-256] vpsraq xmm2{k5}, xmm7, xmm0 vpsraq xmm2{k5}, xmm7, [rbx] vpsraq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsraq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsraq xmm2{k5}{z}, xmm7, xmm0 vpsraq xmm2{k5}{z}, xmm7, [rbx] vpsraq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsraq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsraq ymm16, ymm13, xmm0 vpsraq ymm16, ymm13, [rbx] vpsraq ymm16, ymm13, [rbx+r11*8+256] vpsraq ymm16, ymm13, [rbx+r11*8-256] vpsraq ymm16{k5}, ymm13, xmm0 vpsraq ymm16{k5}, ymm13, [rbx] vpsraq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsraq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsraq ymm16{k5}{z}, ymm13, xmm0 vpsraq ymm16{k5}{z}, ymm13, [rbx] vpsraq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsraq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsraq zmm24, zmm24, xmm0 vpsraq zmm24, zmm24, [rbx] vpsraq zmm24, zmm24, [rbx+r11*8+256] vpsraq zmm24, zmm24, [rbx+r11*8-256] vpsraq zmm24{k5}, zmm24, xmm0 vpsraq zmm24{k5}, zmm24, [rbx] vpsraq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsraq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsraq zmm24{k5}{z}, zmm24, xmm0 vpsraq zmm24{k5}{z}, zmm24, [rbx] vpsraq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsraq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsravd xmm2, xmm7, xmm0 vpsravd xmm2, xmm7, [rbx] vpsravd xmm2, xmm7, [rbx]{1to4} vpsravd xmm2, xmm7, [rbx+r11*8+256] vpsravd xmm2, xmm7, [rbx+r11*8-256] vpsravd xmm2{k5}, xmm7, xmm0 vpsravd xmm2{k5}, xmm7, [rbx] vpsravd xmm2{k5}, xmm7, [rbx]{1to4} vpsravd xmm2{k5}, xmm7, [rbx+r11*8+256] vpsravd xmm2{k5}, xmm7, [rbx+r11*8-256] vpsravd xmm2{k5}{z}, xmm7, xmm0 vpsravd xmm2{k5}{z}, xmm7, [rbx] vpsravd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpsravd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsravd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsravd ymm16, ymm13, ymm15 vpsravd ymm16, ymm13, [rbx] vpsravd ymm16, ymm13, [rbx]{1to8} vpsravd ymm16, ymm13, [rbx+r11*8+256] vpsravd ymm16, ymm13, [rbx+r11*8-256] vpsravd ymm16{k5}, ymm13, ymm15 vpsravd ymm16{k5}, ymm13, [rbx] vpsravd ymm16{k5}, ymm13, [rbx]{1to8} vpsravd ymm16{k5}, ymm13, [rbx+r11*8+256] vpsravd ymm16{k5}, ymm13, [rbx+r11*8-256] vpsravd ymm16{k5}{z}, ymm13, ymm15 vpsravd ymm16{k5}{z}, ymm13, [rbx] vpsravd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpsravd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsravd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsravd zmm24, zmm24, zmm31 vpsravd zmm24, zmm24, [rbx] vpsravd zmm24, zmm24, [rbx]{1to16} vpsravd zmm24, zmm24, [rbx+r11*8+256] vpsravd zmm24, zmm24, [rbx+r11*8-256] vpsravd zmm24{k5}, zmm24, zmm31 vpsravd zmm24{k5}, zmm24, [rbx] vpsravd zmm24{k5}, zmm24, [rbx]{1to16} vpsravd zmm24{k5}, zmm24, [rbx+r11*8+256] vpsravd zmm24{k5}, zmm24, [rbx+r11*8-256] vpsravd zmm24{k5}{z}, zmm24, zmm31 vpsravd zmm24{k5}{z}, zmm24, [rbx] vpsravd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpsravd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsravd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsravq xmm2, xmm7, xmm0 vpsravq xmm2, xmm7, [rbx] vpsravq xmm2, xmm7, [rbx]{1to2} vpsravq xmm2, xmm7, [rbx+r11*8+256] vpsravq xmm2, xmm7, [rbx+r11*8-256] vpsravq xmm2{k5}, xmm7, xmm0 vpsravq xmm2{k5}, xmm7, [rbx] vpsravq xmm2{k5}, xmm7, [rbx]{1to2} vpsravq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsravq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsravq xmm2{k5}{z}, xmm7, xmm0 vpsravq xmm2{k5}{z}, xmm7, [rbx] vpsravq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpsravq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsravq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsravq ymm16, ymm13, ymm15 vpsravq ymm16, ymm13, [rbx] vpsravq ymm16, ymm13, [rbx]{1to4} vpsravq ymm16, ymm13, [rbx+r11*8+256] vpsravq ymm16, ymm13, [rbx+r11*8-256] vpsravq ymm16{k5}, ymm13, ymm15 vpsravq ymm16{k5}, ymm13, [rbx] vpsravq ymm16{k5}, ymm13, [rbx]{1to4} vpsravq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsravq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsravq ymm16{k5}{z}, ymm13, ymm15 vpsravq ymm16{k5}{z}, ymm13, [rbx] vpsravq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpsravq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsravq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsravq zmm24, zmm24, zmm31 vpsravq zmm24, zmm24, [rbx] vpsravq zmm24, zmm24, [rbx]{1to8} vpsravq zmm24, zmm24, [rbx+r11*8+256] vpsravq zmm24, zmm24, [rbx+r11*8-256] vpsravq zmm24{k5}, zmm24, zmm31 vpsravq zmm24{k5}, zmm24, [rbx] vpsravq zmm24{k5}, zmm24, [rbx]{1to8} vpsravq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsravq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsravq zmm24{k5}{z}, zmm24, zmm31 vpsravq zmm24{k5}{z}, zmm24, [rbx] vpsravq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpsravq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsravq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsrld xmm7, xmm0, 10 vpsrld xmm7, [rbx], 10 vpsrld xmm7, [rbx]{1to4}, 10 vpsrld xmm7, [rbx+r11*8+256], 10 vpsrld xmm7, [rbx+r11*8-256], 10 vpsrld ymm13, ymm15, 10 vpsrld ymm13, [rbx], 10 vpsrld ymm13, [rbx]{1to8}, 10 vpsrld ymm13, [rbx+r11*8+256], 10 vpsrld ymm13, [rbx+r11*8-256], 10 vpsrld zmm24, zmm31, 10 vpsrld zmm24, [rbx], 10 vpsrld zmm24, [rbx]{1to16}, 10 vpsrld zmm24, [rbx+r11*8+256], 10 vpsrld zmm24, [rbx+r11*8-256], 10 vpsrld xmm2, xmm7, xmm0 vpsrld xmm2, xmm7, [rbx] vpsrld xmm2, xmm7, [rbx+r11*8+256] vpsrld xmm2, xmm7, [rbx+r11*8-256] vpsrld xmm2{k5}, xmm7, xmm0 vpsrld xmm2{k5}, xmm7, [rbx] vpsrld xmm2{k5}, xmm7, [rbx+r11*8+256] vpsrld xmm2{k5}, xmm7, [rbx+r11*8-256] vpsrld xmm2{k5}{z}, xmm7, xmm0 vpsrld xmm2{k5}{z}, xmm7, [rbx] vpsrld xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsrld xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsrld ymm16, ymm13, xmm0 vpsrld ymm16, ymm13, [rbx] vpsrld ymm16, ymm13, [rbx+r11*8+256] vpsrld ymm16, ymm13, [rbx+r11*8-256] vpsrld ymm16{k5}, ymm13, xmm0 vpsrld ymm16{k5}, ymm13, [rbx] vpsrld ymm16{k5}, ymm13, [rbx+r11*8+256] vpsrld ymm16{k5}, ymm13, [rbx+r11*8-256] vpsrld ymm16{k5}{z}, ymm13, xmm0 vpsrld ymm16{k5}{z}, ymm13, [rbx] vpsrld ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsrld ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsrld zmm24, zmm24, xmm0 vpsrld zmm24, zmm24, [rbx] vpsrld zmm24, zmm24, [rbx+r11*8+256] vpsrld zmm24, zmm24, [rbx+r11*8-256] vpsrld zmm24{k5}, zmm24, xmm0 vpsrld zmm24{k5}, zmm24, [rbx] vpsrld zmm24{k5}, zmm24, [rbx+r11*8+256] vpsrld zmm24{k5}, zmm24, [rbx+r11*8-256] vpsrld zmm24{k5}{z}, zmm24, xmm0 vpsrld zmm24{k5}{z}, zmm24, [rbx] vpsrld zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsrld zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsrlq xmm7, xmm0, 10 vpsrlq xmm7, [rbx], 10 vpsrlq xmm7, [rbx]{1to2}, 10 vpsrlq xmm7, [rbx+r11*8+256], 10 vpsrlq xmm7, [rbx+r11*8-256], 10 vpsrlq ymm13, ymm15, 10 vpsrlq ymm13, [rbx], 10 vpsrlq ymm13, [rbx]{1to4}, 10 vpsrlq ymm13, [rbx+r11*8+256], 10 vpsrlq ymm13, [rbx+r11*8-256], 10 vpsrlq zmm24, zmm31, 10 vpsrlq zmm24, [rbx], 10 vpsrlq zmm24, [rbx]{1to8}, 10 vpsrlq zmm24, [rbx+r11*8+256], 10 vpsrlq zmm24, [rbx+r11*8-256], 10 vpsrlq xmm2, xmm7, xmm0 vpsrlq xmm2, xmm7, [rbx] vpsrlq xmm2, xmm7, [rbx+r11*8+256] vpsrlq xmm2, xmm7, [rbx+r11*8-256] vpsrlq xmm2{k5}, xmm7, xmm0 vpsrlq xmm2{k5}, xmm7, [rbx] vpsrlq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsrlq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsrlq xmm2{k5}{z}, xmm7, xmm0 vpsrlq xmm2{k5}{z}, xmm7, [rbx] vpsrlq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsrlq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsrlq ymm16, ymm13, xmm0 vpsrlq ymm16, ymm13, [rbx] vpsrlq ymm16, ymm13, [rbx+r11*8+256] vpsrlq ymm16, ymm13, [rbx+r11*8-256] vpsrlq ymm16{k5}, ymm13, xmm0 vpsrlq ymm16{k5}, ymm13, [rbx] vpsrlq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsrlq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsrlq ymm16{k5}{z}, ymm13, xmm0 vpsrlq ymm16{k5}{z}, ymm13, [rbx] vpsrlq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsrlq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsrlq zmm24, zmm24, xmm0 vpsrlq zmm24, zmm24, [rbx] vpsrlq zmm24, zmm24, [rbx+r11*8+256] vpsrlq zmm24, zmm24, [rbx+r11*8-256] vpsrlq zmm24{k5}, zmm24, xmm0 vpsrlq zmm24{k5}, zmm24, [rbx] vpsrlq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsrlq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsrlq zmm24{k5}{z}, zmm24, xmm0 vpsrlq zmm24{k5}{z}, zmm24, [rbx] vpsrlq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsrlq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsrlvd xmm2, xmm7, xmm0 vpsrlvd xmm2, xmm7, [rbx] vpsrlvd xmm2, xmm7, [rbx]{1to4} vpsrlvd xmm2, xmm7, [rbx+r11*8+256] vpsrlvd xmm2, xmm7, [rbx+r11*8-256] vpsrlvd xmm2{k5}, xmm7, xmm0 vpsrlvd xmm2{k5}, xmm7, [rbx] vpsrlvd xmm2{k5}, xmm7, [rbx]{1to4} vpsrlvd xmm2{k5}, xmm7, [rbx+r11*8+256] vpsrlvd xmm2{k5}, xmm7, [rbx+r11*8-256] vpsrlvd xmm2{k5}{z}, xmm7, xmm0 vpsrlvd xmm2{k5}{z}, xmm7, [rbx] vpsrlvd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpsrlvd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsrlvd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsrlvd ymm16, ymm13, ymm15 vpsrlvd ymm16, ymm13, [rbx] vpsrlvd ymm16, ymm13, [rbx]{1to8} vpsrlvd ymm16, ymm13, [rbx+r11*8+256] vpsrlvd ymm16, ymm13, [rbx+r11*8-256] vpsrlvd ymm16{k5}, ymm13, ymm15 vpsrlvd ymm16{k5}, ymm13, [rbx] vpsrlvd ymm16{k5}, ymm13, [rbx]{1to8} vpsrlvd ymm16{k5}, ymm13, [rbx+r11*8+256] vpsrlvd ymm16{k5}, ymm13, [rbx+r11*8-256] vpsrlvd ymm16{k5}{z}, ymm13, ymm15 vpsrlvd ymm16{k5}{z}, ymm13, [rbx] vpsrlvd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpsrlvd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsrlvd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsrlvd zmm24, zmm24, zmm31 vpsrlvd zmm24, zmm24, [rbx] vpsrlvd zmm24, zmm24, [rbx]{1to16} vpsrlvd zmm24, zmm24, [rbx+r11*8+256] vpsrlvd zmm24, zmm24, [rbx+r11*8-256] vpsrlvd zmm24{k5}, zmm24, zmm31 vpsrlvd zmm24{k5}, zmm24, [rbx] vpsrlvd zmm24{k5}, zmm24, [rbx]{1to16} vpsrlvd zmm24{k5}, zmm24, [rbx+r11*8+256] vpsrlvd zmm24{k5}, zmm24, [rbx+r11*8-256] vpsrlvd zmm24{k5}{z}, zmm24, zmm31 vpsrlvd zmm24{k5}{z}, zmm24, [rbx] vpsrlvd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpsrlvd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsrlvd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsrlvq xmm2, xmm7, xmm0 vpsrlvq xmm2, xmm7, [rbx] vpsrlvq xmm2, xmm7, [rbx]{1to2} vpsrlvq xmm2, xmm7, [rbx+r11*8+256] vpsrlvq xmm2, xmm7, [rbx+r11*8-256] vpsrlvq xmm2{k5}, xmm7, xmm0 vpsrlvq xmm2{k5}, xmm7, [rbx] vpsrlvq xmm2{k5}, xmm7, [rbx]{1to2} vpsrlvq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsrlvq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsrlvq xmm2{k5}{z}, xmm7, xmm0 vpsrlvq xmm2{k5}{z}, xmm7, [rbx] vpsrlvq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpsrlvq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsrlvq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsrlvq ymm16, ymm13, ymm15 vpsrlvq ymm16, ymm13, [rbx] vpsrlvq ymm16, ymm13, [rbx]{1to4} vpsrlvq ymm16, ymm13, [rbx+r11*8+256] vpsrlvq ymm16, ymm13, [rbx+r11*8-256] vpsrlvq ymm16{k5}, ymm13, ymm15 vpsrlvq ymm16{k5}, ymm13, [rbx] vpsrlvq ymm16{k5}, ymm13, [rbx]{1to4} vpsrlvq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsrlvq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsrlvq ymm16{k5}{z}, ymm13, ymm15 vpsrlvq ymm16{k5}{z}, ymm13, [rbx] vpsrlvq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpsrlvq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsrlvq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsrlvq zmm24, zmm24, zmm31 vpsrlvq zmm24, zmm24, [rbx] vpsrlvq zmm24, zmm24, [rbx]{1to8} vpsrlvq zmm24, zmm24, [rbx+r11*8+256] vpsrlvq zmm24, zmm24, [rbx+r11*8-256] vpsrlvq zmm24{k5}, zmm24, zmm31 vpsrlvq zmm24{k5}, zmm24, [rbx] vpsrlvq zmm24{k5}, zmm24, [rbx]{1to8} vpsrlvq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsrlvq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsrlvq zmm24{k5}{z}, zmm24, zmm31 vpsrlvq zmm24{k5}{z}, zmm24, [rbx] vpsrlvq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpsrlvq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsrlvq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsubd xmm2, xmm7, xmm0 vpsubd xmm2, xmm7, [rbx] vpsubd xmm2, xmm7, [rbx]{1to4} vpsubd xmm2, xmm7, [rbx+r11*8+256] vpsubd xmm2, xmm7, [rbx+r11*8-256] vpsubd xmm2{k5}, xmm7, xmm0 vpsubd xmm2{k5}, xmm7, [rbx] vpsubd xmm2{k5}, xmm7, [rbx]{1to4} vpsubd xmm2{k5}, xmm7, [rbx+r11*8+256] vpsubd xmm2{k5}, xmm7, [rbx+r11*8-256] vpsubd xmm2{k5}{z}, xmm7, xmm0 vpsubd xmm2{k5}{z}, xmm7, [rbx] vpsubd xmm2{k5}{z}, xmm7, [rbx]{1to4} vpsubd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsubd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsubd ymm16, ymm13, ymm15 vpsubd ymm16, ymm13, [rbx] vpsubd ymm16, ymm13, [rbx]{1to8} vpsubd ymm16, ymm13, [rbx+r11*8+256] vpsubd ymm16, ymm13, [rbx+r11*8-256] vpsubd ymm16{k5}, ymm13, ymm15 vpsubd ymm16{k5}, ymm13, [rbx] vpsubd ymm16{k5}, ymm13, [rbx]{1to8} vpsubd ymm16{k5}, ymm13, [rbx+r11*8+256] vpsubd ymm16{k5}, ymm13, [rbx+r11*8-256] vpsubd ymm16{k5}{z}, ymm13, ymm15 vpsubd ymm16{k5}{z}, ymm13, [rbx] vpsubd ymm16{k5}{z}, ymm13, [rbx]{1to8} vpsubd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsubd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsubd zmm24, zmm24, zmm31 vpsubd zmm24, zmm24, [rbx] vpsubd zmm24, zmm24, [rbx]{1to16} vpsubd zmm24, zmm24, [rbx+r11*8+256] vpsubd zmm24, zmm24, [rbx+r11*8-256] vpsubd zmm24{k5}, zmm24, zmm31 vpsubd zmm24{k5}, zmm24, [rbx] vpsubd zmm24{k5}, zmm24, [rbx]{1to16} vpsubd zmm24{k5}, zmm24, [rbx+r11*8+256] vpsubd zmm24{k5}, zmm24, [rbx+r11*8-256] vpsubd zmm24{k5}{z}, zmm24, zmm31 vpsubd zmm24{k5}{z}, zmm24, [rbx] vpsubd zmm24{k5}{z}, zmm24, [rbx]{1to16} vpsubd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsubd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpsubq xmm2, xmm7, xmm0 vpsubq xmm2, xmm7, [rbx] vpsubq xmm2, xmm7, [rbx]{1to2} vpsubq xmm2, xmm7, [rbx+r11*8+256] vpsubq xmm2, xmm7, [rbx+r11*8-256] vpsubq xmm2{k5}, xmm7, xmm0 vpsubq xmm2{k5}, xmm7, [rbx] vpsubq xmm2{k5}, xmm7, [rbx]{1to2} vpsubq xmm2{k5}, xmm7, [rbx+r11*8+256] vpsubq xmm2{k5}, xmm7, [rbx+r11*8-256] vpsubq xmm2{k5}{z}, xmm7, xmm0 vpsubq xmm2{k5}{z}, xmm7, [rbx] vpsubq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpsubq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpsubq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpsubq ymm16, ymm13, ymm15 vpsubq ymm16, ymm13, [rbx] vpsubq ymm16, ymm13, [rbx]{1to4} vpsubq ymm16, ymm13, [rbx+r11*8+256] vpsubq ymm16, ymm13, [rbx+r11*8-256] vpsubq ymm16{k5}, ymm13, ymm15 vpsubq ymm16{k5}, ymm13, [rbx] vpsubq ymm16{k5}, ymm13, [rbx]{1to4} vpsubq ymm16{k5}, ymm13, [rbx+r11*8+256] vpsubq ymm16{k5}, ymm13, [rbx+r11*8-256] vpsubq ymm16{k5}{z}, ymm13, ymm15 vpsubq ymm16{k5}{z}, ymm13, [rbx] vpsubq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpsubq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpsubq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpsubq zmm24, zmm24, zmm31 vpsubq zmm24, zmm24, [rbx] vpsubq zmm24, zmm24, [rbx]{1to8} vpsubq zmm24, zmm24, [rbx+r11*8+256] vpsubq zmm24, zmm24, [rbx+r11*8-256] vpsubq zmm24{k5}, zmm24, zmm31 vpsubq zmm24{k5}, zmm24, [rbx] vpsubq zmm24{k5}, zmm24, [rbx]{1to8} vpsubq zmm24{k5}, zmm24, [rbx+r11*8+256] vpsubq zmm24{k5}, zmm24, [rbx+r11*8-256] vpsubq zmm24{k5}{z}, zmm24, zmm31 vpsubq zmm24{k5}{z}, zmm24, [rbx] vpsubq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpsubq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpsubq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpternlogd xmm2, xmm7, xmm0, 10 vpternlogd xmm2, xmm7, [rbx], 10 vpternlogd xmm2, xmm7, [rbx]{1to4}, 10 vpternlogd xmm2, xmm7, [rbx+r11*8+256], 10 vpternlogd xmm2, xmm7, [rbx+r11*8-256], 10 vpternlogd xmm2{k5}, xmm7, xmm0, 10 vpternlogd xmm2{k5}, xmm7, [rbx], 10 vpternlogd xmm2{k5}, xmm7, [rbx]{1to4}, 10 vpternlogd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vpternlogd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vpternlogd xmm2{k5}{z}, xmm7, xmm0, 10 vpternlogd xmm2{k5}{z}, xmm7, [rbx], 10 vpternlogd xmm2{k5}{z}, xmm7, [rbx]{1to4}, 10 vpternlogd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vpternlogd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vpternlogd ymm16, ymm13, ymm15, 10 vpternlogd ymm16, ymm13, [rbx], 10 vpternlogd ymm16, ymm13, [rbx]{1to8}, 10 vpternlogd ymm16, ymm13, [rbx+r11*8+256], 10 vpternlogd ymm16, ymm13, [rbx+r11*8-256], 10 vpternlogd ymm16{k5}, ymm13, ymm15, 10 vpternlogd ymm16{k5}, ymm13, [rbx], 10 vpternlogd ymm16{k5}, ymm13, [rbx]{1to8}, 10 vpternlogd ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vpternlogd ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vpternlogd ymm16{k5}{z}, ymm13, ymm15, 10 vpternlogd ymm16{k5}{z}, ymm13, [rbx], 10 vpternlogd ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 vpternlogd ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vpternlogd ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vpternlogd zmm24, zmm24, zmm31, 10 vpternlogd zmm24, zmm24, [rbx], 10 vpternlogd zmm24, zmm24, [rbx]{1to16}, 10 vpternlogd zmm24, zmm24, [rbx+r11*8+256], 10 vpternlogd zmm24, zmm24, [rbx+r11*8-256], 10 vpternlogd zmm24{k5}, zmm24, zmm31, 10 vpternlogd zmm24{k5}, zmm24, [rbx], 10 vpternlogd zmm24{k5}, zmm24, [rbx]{1to16}, 10 vpternlogd zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vpternlogd zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vpternlogd zmm24{k5}{z}, zmm24, zmm31, 10 vpternlogd zmm24{k5}{z}, zmm24, [rbx], 10 vpternlogd zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 vpternlogd zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vpternlogd zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vpternlogq xmm2, xmm7, xmm0, 10 vpternlogq xmm2, xmm7, [rbx], 10 vpternlogq xmm2, xmm7, [rbx]{1to2}, 10 vpternlogq xmm2, xmm7, [rbx+r11*8+256], 10 vpternlogq xmm2, xmm7, [rbx+r11*8-256], 10 vpternlogq xmm2{k5}, xmm7, xmm0, 10 vpternlogq xmm2{k5}, xmm7, [rbx], 10 vpternlogq xmm2{k5}, xmm7, [rbx]{1to2}, 10 vpternlogq xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vpternlogq xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vpternlogq xmm2{k5}{z}, xmm7, xmm0, 10 vpternlogq xmm2{k5}{z}, xmm7, [rbx], 10 vpternlogq xmm2{k5}{z}, xmm7, [rbx]{1to2}, 10 vpternlogq xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vpternlogq xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vpternlogq ymm16, ymm13, ymm15, 10 vpternlogq ymm16, ymm13, [rbx], 10 vpternlogq ymm16, ymm13, [rbx]{1to4}, 10 vpternlogq ymm16, ymm13, [rbx+r11*8+256], 10 vpternlogq ymm16, ymm13, [rbx+r11*8-256], 10 vpternlogq ymm16{k5}, ymm13, ymm15, 10 vpternlogq ymm16{k5}, ymm13, [rbx], 10 vpternlogq ymm16{k5}, ymm13, [rbx]{1to4}, 10 vpternlogq ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vpternlogq ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vpternlogq ymm16{k5}{z}, ymm13, ymm15, 10 vpternlogq ymm16{k5}{z}, ymm13, [rbx], 10 vpternlogq ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 vpternlogq ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vpternlogq ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vpternlogq zmm24, zmm24, zmm31, 10 vpternlogq zmm24, zmm24, [rbx], 10 vpternlogq zmm24, zmm24, [rbx]{1to8}, 10 vpternlogq zmm24, zmm24, [rbx+r11*8+256], 10 vpternlogq zmm24, zmm24, [rbx+r11*8-256], 10 vpternlogq zmm24{k5}, zmm24, zmm31, 10 vpternlogq zmm24{k5}, zmm24, [rbx], 10 vpternlogq zmm24{k5}, zmm24, [rbx]{1to8}, 10 vpternlogq zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vpternlogq zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vpternlogq zmm24{k5}{z}, zmm24, zmm31, 10 vpternlogq zmm24{k5}{z}, zmm24, [rbx], 10 vpternlogq zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 vpternlogq zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vpternlogq zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vptestmd k3, xmm7, xmm0 vptestmd k3, xmm7, [rbx] vptestmd k3, xmm7, [rbx]{1to4} vptestmd k3, xmm7, [rbx+r11*8+256] vptestmd k3, xmm7, [rbx+r11*8-256] vptestmd k3, ymm13, ymm15 vptestmd k3, ymm13, [rbx] vptestmd k3, ymm13, [rbx]{1to8} vptestmd k3, ymm13, [rbx+r11*8+256] vptestmd k3, ymm13, [rbx+r11*8-256] vptestmd k3, zmm24, zmm31 vptestmd k3, zmm24, [rbx] vptestmd k3, zmm24, [rbx]{1to16} vptestmd k3, zmm24, [rbx+r11*8+256] vptestmd k3, zmm24, [rbx+r11*8-256] vptestmd k3{k5}, xmm7, xmm0 vptestmd k3{k5}, xmm7, [rbx] vptestmd k3{k5}, xmm7, [rbx]{1to4} vptestmd k3{k5}, xmm7, [rbx+r11*8+256] vptestmd k3{k5}, xmm7, [rbx+r11*8-256] vptestmd k3{k5}, ymm13, ymm15 vptestmd k3{k5}, ymm13, [rbx] vptestmd k3{k5}, ymm13, [rbx]{1to8} vptestmd k3{k5}, ymm13, [rbx+r11*8+256] vptestmd k3{k5}, ymm13, [rbx+r11*8-256] vptestmd k3{k5}, zmm24, zmm31 vptestmd k3{k5}, zmm24, [rbx] vptestmd k3{k5}, zmm24, [rbx]{1to16} vptestmd k3{k5}, zmm24, [rbx+r11*8+256] vptestmd k3{k5}, zmm24, [rbx+r11*8-256] vptestmq k3, xmm7, xmm0 vptestmq k3, xmm7, [rbx] vptestmq k3, xmm7, [rbx]{1to2} vptestmq k3, xmm7, [rbx+r11*8+256] vptestmq k3, xmm7, [rbx+r11*8-256] vptestmq k3, ymm13, ymm15 vptestmq k3, ymm13, [rbx] vptestmq k3, ymm13, [rbx]{1to4} vptestmq k3, ymm13, [rbx+r11*8+256] vptestmq k3, ymm13, [rbx+r11*8-256] vptestmq k3, zmm24, zmm31 vptestmq k3, zmm24, [rbx] vptestmq k3, zmm24, [rbx]{1to8} vptestmq k3, zmm24, [rbx+r11*8+256] vptestmq k3, zmm24, [rbx+r11*8-256] vptestmq k3{k5}, xmm7, xmm0 vptestmq k3{k5}, xmm7, [rbx] vptestmq k3{k5}, xmm7, [rbx]{1to2} vptestmq k3{k5}, xmm7, [rbx+r11*8+256] vptestmq k3{k5}, xmm7, [rbx+r11*8-256] vptestmq k3{k5}, ymm13, ymm15 vptestmq k3{k5}, ymm13, [rbx] vptestmq k3{k5}, ymm13, [rbx]{1to4} vptestmq k3{k5}, ymm13, [rbx+r11*8+256] vptestmq k3{k5}, ymm13, [rbx+r11*8-256] vptestmq k3{k5}, zmm24, zmm31 vptestmq k3{k5}, zmm24, [rbx] vptestmq k3{k5}, zmm24, [rbx]{1to8} vptestmq k3{k5}, zmm24, [rbx+r11*8+256] vptestmq k3{k5}, zmm24, [rbx+r11*8-256] vptestnmd k3, xmm7, xmm0 vptestnmd k3, xmm7, [rbx] vptestnmd k3, xmm7, [rbx]{1to4} vptestnmd k3, xmm7, [rbx+r11*8+256] vptestnmd k3, xmm7, [rbx+r11*8-256] vptestnmd k3, ymm13, ymm15 vptestnmd k3, ymm13, [rbx] vptestnmd k3, ymm13, [rbx]{1to8} vptestnmd k3, ymm13, [rbx+r11*8+256] vptestnmd k3, ymm13, [rbx+r11*8-256] vptestnmd k3, zmm24, zmm31 vptestnmd k3, zmm24, [rbx] vptestnmd k3, zmm24, [rbx]{1to16} vptestnmd k3, zmm24, [rbx+r11*8+256] vptestnmd k3, zmm24, [rbx+r11*8-256] vptestnmd k3{k5}, xmm7, xmm0 vptestnmd k3{k5}, xmm7, [rbx] vptestnmd k3{k5}, xmm7, [rbx]{1to4} vptestnmd k3{k5}, xmm7, [rbx+r11*8+256] vptestnmd k3{k5}, xmm7, [rbx+r11*8-256] vptestnmd k3{k5}, ymm13, ymm15 vptestnmd k3{k5}, ymm13, [rbx] vptestnmd k3{k5}, ymm13, [rbx]{1to8} vptestnmd k3{k5}, ymm13, [rbx+r11*8+256] vptestnmd k3{k5}, ymm13, [rbx+r11*8-256] vptestnmd k3{k5}, zmm24, zmm31 vptestnmd k3{k5}, zmm24, [rbx] vptestnmd k3{k5}, zmm24, [rbx]{1to16} vptestnmd k3{k5}, zmm24, [rbx+r11*8+256] vptestnmd k3{k5}, zmm24, [rbx+r11*8-256] vptestnmq k3, xmm7, xmm0 vptestnmq k3, xmm7, [rbx] vptestnmq k3, xmm7, [rbx]{1to2} vptestnmq k3, xmm7, [rbx+r11*8+256] vptestnmq k3, xmm7, [rbx+r11*8-256] vptestnmq k3, ymm13, ymm15 vptestnmq k3, ymm13, [rbx] vptestnmq k3, ymm13, [rbx]{1to4} vptestnmq k3, ymm13, [rbx+r11*8+256] vptestnmq k3, ymm13, [rbx+r11*8-256] vptestnmq k3, zmm24, zmm31 vptestnmq k3, zmm24, [rbx] vptestnmq k3, zmm24, [rbx]{1to8} vptestnmq k3, zmm24, [rbx+r11*8+256] vptestnmq k3, zmm24, [rbx+r11*8-256] vptestnmq k3{k5}, xmm7, xmm0 vptestnmq k3{k5}, xmm7, [rbx] vptestnmq k3{k5}, xmm7, [rbx]{1to2} vptestnmq k3{k5}, xmm7, [rbx+r11*8+256] vptestnmq k3{k5}, xmm7, [rbx+r11*8-256] vptestnmq k3{k5}, ymm13, ymm15 vptestnmq k3{k5}, ymm13, [rbx] vptestnmq k3{k5}, ymm13, [rbx]{1to4} vptestnmq k3{k5}, ymm13, [rbx+r11*8+256] vptestnmq k3{k5}, ymm13, [rbx+r11*8-256] vptestnmq k3{k5}, zmm24, zmm31 vptestnmq k3{k5}, zmm24, [rbx] vptestnmq k3{k5}, zmm24, [rbx]{1to8} vptestnmq k3{k5}, zmm24, [rbx+r11*8+256] vptestnmq k3{k5}, zmm24, [rbx+r11*8-256] vpunpckhdq xmm2, xmm7, xmm0 vpunpckhdq xmm2, xmm7, [rbx] vpunpckhdq xmm2, xmm7, [rbx]{1to4} vpunpckhdq xmm2, xmm7, [rbx+r11*8+256] vpunpckhdq xmm2, xmm7, [rbx+r11*8-256] vpunpckhdq xmm2{k5}, xmm7, xmm0 vpunpckhdq xmm2{k5}, xmm7, [rbx] vpunpckhdq xmm2{k5}, xmm7, [rbx]{1to4} vpunpckhdq xmm2{k5}, xmm7, [rbx+r11*8+256] vpunpckhdq xmm2{k5}, xmm7, [rbx+r11*8-256] vpunpckhdq xmm2{k5}{z}, xmm7, xmm0 vpunpckhdq xmm2{k5}{z}, xmm7, [rbx] vpunpckhdq xmm2{k5}{z}, xmm7, [rbx]{1to4} vpunpckhdq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpunpckhdq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpunpckhdq ymm16, ymm13, ymm15 vpunpckhdq ymm16, ymm13, [rbx] vpunpckhdq ymm16, ymm13, [rbx]{1to8} vpunpckhdq ymm16, ymm13, [rbx+r11*8+256] vpunpckhdq ymm16, ymm13, [rbx+r11*8-256] vpunpckhdq ymm16{k5}, ymm13, ymm15 vpunpckhdq ymm16{k5}, ymm13, [rbx] vpunpckhdq ymm16{k5}, ymm13, [rbx]{1to8} vpunpckhdq ymm16{k5}, ymm13, [rbx+r11*8+256] vpunpckhdq ymm16{k5}, ymm13, [rbx+r11*8-256] vpunpckhdq ymm16{k5}{z}, ymm13, ymm15 vpunpckhdq ymm16{k5}{z}, ymm13, [rbx] vpunpckhdq ymm16{k5}{z}, ymm13, [rbx]{1to8} vpunpckhdq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpunpckhdq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpunpckhdq zmm24, zmm24, zmm31 vpunpckhdq zmm24, zmm24, [rbx] vpunpckhdq zmm24, zmm24, [rbx]{1to16} vpunpckhdq zmm24, zmm24, [rbx+r11*8+256] vpunpckhdq zmm24, zmm24, [rbx+r11*8-256] vpunpckhdq zmm24{k5}, zmm24, zmm31 vpunpckhdq zmm24{k5}, zmm24, [rbx] vpunpckhdq zmm24{k5}, zmm24, [rbx]{1to16} vpunpckhdq zmm24{k5}, zmm24, [rbx+r11*8+256] vpunpckhdq zmm24{k5}, zmm24, [rbx+r11*8-256] vpunpckhdq zmm24{k5}{z}, zmm24, zmm31 vpunpckhdq zmm24{k5}{z}, zmm24, [rbx] vpunpckhdq zmm24{k5}{z}, zmm24, [rbx]{1to16} vpunpckhdq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpunpckhdq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpunpckhqdq xmm2, xmm7, xmm0 vpunpckhqdq xmm2, xmm7, [rbx] vpunpckhqdq xmm2, xmm7, [rbx]{1to2} vpunpckhqdq xmm2, xmm7, [rbx+r11*8+256] vpunpckhqdq xmm2, xmm7, [rbx+r11*8-256] vpunpckhqdq xmm2{k5}, xmm7, xmm0 vpunpckhqdq xmm2{k5}, xmm7, [rbx] vpunpckhqdq xmm2{k5}, xmm7, [rbx]{1to2} vpunpckhqdq xmm2{k5}, xmm7, [rbx+r11*8+256] vpunpckhqdq xmm2{k5}, xmm7, [rbx+r11*8-256] vpunpckhqdq xmm2{k5}{z}, xmm7, xmm0 vpunpckhqdq xmm2{k5}{z}, xmm7, [rbx] vpunpckhqdq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpunpckhqdq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpunpckhqdq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpunpckhqdq ymm16, ymm13, ymm15 vpunpckhqdq ymm16, ymm13, [rbx] vpunpckhqdq ymm16, ymm13, [rbx]{1to4} vpunpckhqdq ymm16, ymm13, [rbx+r11*8+256] vpunpckhqdq ymm16, ymm13, [rbx+r11*8-256] vpunpckhqdq ymm16{k5}, ymm13, ymm15 vpunpckhqdq ymm16{k5}, ymm13, [rbx] vpunpckhqdq ymm16{k5}, ymm13, [rbx]{1to4} vpunpckhqdq ymm16{k5}, ymm13, [rbx+r11*8+256] vpunpckhqdq ymm16{k5}, ymm13, [rbx+r11*8-256] vpunpckhqdq ymm16{k5}{z}, ymm13, ymm15 vpunpckhqdq ymm16{k5}{z}, ymm13, [rbx] vpunpckhqdq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpunpckhqdq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpunpckhqdq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpunpckhqdq zmm24, zmm24, zmm31 vpunpckhqdq zmm24, zmm24, [rbx] vpunpckhqdq zmm24, zmm24, [rbx]{1to8} vpunpckhqdq zmm24, zmm24, [rbx+r11*8+256] vpunpckhqdq zmm24, zmm24, [rbx+r11*8-256] vpunpckhqdq zmm24{k5}, zmm24, zmm31 vpunpckhqdq zmm24{k5}, zmm24, [rbx] vpunpckhqdq zmm24{k5}, zmm24, [rbx]{1to8} vpunpckhqdq zmm24{k5}, zmm24, [rbx+r11*8+256] vpunpckhqdq zmm24{k5}, zmm24, [rbx+r11*8-256] vpunpckhqdq zmm24{k5}{z}, zmm24, zmm31 vpunpckhqdq zmm24{k5}{z}, zmm24, [rbx] vpunpckhqdq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpunpckhqdq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpunpckhqdq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpunpckldq xmm2, xmm7, xmm0 vpunpckldq xmm2, xmm7, [rbx] vpunpckldq xmm2, xmm7, [rbx]{1to4} vpunpckldq xmm2, xmm7, [rbx+r11*8+256] vpunpckldq xmm2, xmm7, [rbx+r11*8-256] vpunpckldq xmm2{k5}, xmm7, xmm0 vpunpckldq xmm2{k5}, xmm7, [rbx] vpunpckldq xmm2{k5}, xmm7, [rbx]{1to4} vpunpckldq xmm2{k5}, xmm7, [rbx+r11*8+256] vpunpckldq xmm2{k5}, xmm7, [rbx+r11*8-256] vpunpckldq xmm2{k5}{z}, xmm7, xmm0 vpunpckldq xmm2{k5}{z}, xmm7, [rbx] vpunpckldq xmm2{k5}{z}, xmm7, [rbx]{1to4} vpunpckldq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpunpckldq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpunpckldq ymm16, ymm13, ymm15 vpunpckldq ymm16, ymm13, [rbx] vpunpckldq ymm16, ymm13, [rbx]{1to8} vpunpckldq ymm16, ymm13, [rbx+r11*8+256] vpunpckldq ymm16, ymm13, [rbx+r11*8-256] vpunpckldq ymm16{k5}, ymm13, ymm15 vpunpckldq ymm16{k5}, ymm13, [rbx] vpunpckldq ymm16{k5}, ymm13, [rbx]{1to8} vpunpckldq ymm16{k5}, ymm13, [rbx+r11*8+256] vpunpckldq ymm16{k5}, ymm13, [rbx+r11*8-256] vpunpckldq ymm16{k5}{z}, ymm13, ymm15 vpunpckldq ymm16{k5}{z}, ymm13, [rbx] vpunpckldq ymm16{k5}{z}, ymm13, [rbx]{1to8} vpunpckldq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpunpckldq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpunpckldq zmm24, zmm24, zmm31 vpunpckldq zmm24, zmm24, [rbx] vpunpckldq zmm24, zmm24, [rbx]{1to16} vpunpckldq zmm24, zmm24, [rbx+r11*8+256] vpunpckldq zmm24, zmm24, [rbx+r11*8-256] vpunpckldq zmm24{k5}, zmm24, zmm31 vpunpckldq zmm24{k5}, zmm24, [rbx] vpunpckldq zmm24{k5}, zmm24, [rbx]{1to16} vpunpckldq zmm24{k5}, zmm24, [rbx+r11*8+256] vpunpckldq zmm24{k5}, zmm24, [rbx+r11*8-256] vpunpckldq zmm24{k5}{z}, zmm24, zmm31 vpunpckldq zmm24{k5}{z}, zmm24, [rbx] vpunpckldq zmm24{k5}{z}, zmm24, [rbx]{1to16} vpunpckldq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpunpckldq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpunpcklqdq xmm2, xmm7, xmm0 vpunpcklqdq xmm2, xmm7, [rbx] vpunpcklqdq xmm2, xmm7, [rbx]{1to2} vpunpcklqdq xmm2, xmm7, [rbx+r11*8+256] vpunpcklqdq xmm2, xmm7, [rbx+r11*8-256] vpunpcklqdq xmm2{k5}, xmm7, xmm0 vpunpcklqdq xmm2{k5}, xmm7, [rbx] vpunpcklqdq xmm2{k5}, xmm7, [rbx]{1to2} vpunpcklqdq xmm2{k5}, xmm7, [rbx+r11*8+256] vpunpcklqdq xmm2{k5}, xmm7, [rbx+r11*8-256] vpunpcklqdq xmm2{k5}{z}, xmm7, xmm0 vpunpcklqdq xmm2{k5}{z}, xmm7, [rbx] vpunpcklqdq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpunpcklqdq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpunpcklqdq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpunpcklqdq ymm16, ymm13, ymm15 vpunpcklqdq ymm16, ymm13, [rbx] vpunpcklqdq ymm16, ymm13, [rbx]{1to4} vpunpcklqdq ymm16, ymm13, [rbx+r11*8+256] vpunpcklqdq ymm16, ymm13, [rbx+r11*8-256] vpunpcklqdq ymm16{k5}, ymm13, ymm15 vpunpcklqdq ymm16{k5}, ymm13, [rbx] vpunpcklqdq ymm16{k5}, ymm13, [rbx]{1to4} vpunpcklqdq ymm16{k5}, ymm13, [rbx+r11*8+256] vpunpcklqdq ymm16{k5}, ymm13, [rbx+r11*8-256] vpunpcklqdq ymm16{k5}{z}, ymm13, ymm15 vpunpcklqdq ymm16{k5}{z}, ymm13, [rbx] vpunpcklqdq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpunpcklqdq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpunpcklqdq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpunpcklqdq zmm24, zmm24, zmm31 vpunpcklqdq zmm24, zmm24, [rbx] vpunpcklqdq zmm24, zmm24, [rbx]{1to8} vpunpcklqdq zmm24, zmm24, [rbx+r11*8+256] vpunpcklqdq zmm24, zmm24, [rbx+r11*8-256] vpunpcklqdq zmm24{k5}, zmm24, zmm31 vpunpcklqdq zmm24{k5}, zmm24, [rbx] vpunpcklqdq zmm24{k5}, zmm24, [rbx]{1to8} vpunpcklqdq zmm24{k5}, zmm24, [rbx+r11*8+256] vpunpcklqdq zmm24{k5}, zmm24, [rbx+r11*8-256] vpunpcklqdq zmm24{k5}{z}, zmm24, zmm31 vpunpcklqdq zmm24{k5}{z}, zmm24, [rbx] vpunpcklqdq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpunpcklqdq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpunpcklqdq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpxord xmm2, xmm7, xmm0 vpxord xmm2, xmm7, [rbx] vpxord xmm2, xmm7, [rbx]{1to4} vpxord xmm2, xmm7, [rbx+r11*8+256] vpxord xmm2, xmm7, [rbx+r11*8-256] vpxord xmm2{k5}, xmm7, xmm0 vpxord xmm2{k5}, xmm7, [rbx] vpxord xmm2{k5}, xmm7, [rbx]{1to4} vpxord xmm2{k5}, xmm7, [rbx+r11*8+256] vpxord xmm2{k5}, xmm7, [rbx+r11*8-256] vpxord xmm2{k5}{z}, xmm7, xmm0 vpxord xmm2{k5}{z}, xmm7, [rbx] vpxord xmm2{k5}{z}, xmm7, [rbx]{1to4} vpxord xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpxord xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpxord ymm16, ymm13, ymm15 vpxord ymm16, ymm13, [rbx] vpxord ymm16, ymm13, [rbx]{1to8} vpxord ymm16, ymm13, [rbx+r11*8+256] vpxord ymm16, ymm13, [rbx+r11*8-256] vpxord ymm16{k5}, ymm13, ymm15 vpxord ymm16{k5}, ymm13, [rbx] vpxord ymm16{k5}, ymm13, [rbx]{1to8} vpxord ymm16{k5}, ymm13, [rbx+r11*8+256] vpxord ymm16{k5}, ymm13, [rbx+r11*8-256] vpxord ymm16{k5}{z}, ymm13, ymm15 vpxord ymm16{k5}{z}, ymm13, [rbx] vpxord ymm16{k5}{z}, ymm13, [rbx]{1to8} vpxord ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpxord ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpxord zmm24, zmm24, zmm31 vpxord zmm24, zmm24, [rbx] vpxord zmm24, zmm24, [rbx]{1to16} vpxord zmm24, zmm24, [rbx+r11*8+256] vpxord zmm24, zmm24, [rbx+r11*8-256] vpxord zmm24{k5}, zmm24, zmm31 vpxord zmm24{k5}, zmm24, [rbx] vpxord zmm24{k5}, zmm24, [rbx]{1to16} vpxord zmm24{k5}, zmm24, [rbx+r11*8+256] vpxord zmm24{k5}, zmm24, [rbx+r11*8-256] vpxord zmm24{k5}{z}, zmm24, zmm31 vpxord zmm24{k5}{z}, zmm24, [rbx] vpxord zmm24{k5}{z}, zmm24, [rbx]{1to16} vpxord zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpxord zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vpxorq xmm2, xmm7, xmm0 vpxorq xmm2, xmm7, [rbx] vpxorq xmm2, xmm7, [rbx]{1to2} vpxorq xmm2, xmm7, [rbx+r11*8+256] vpxorq xmm2, xmm7, [rbx+r11*8-256] vpxorq xmm2{k5}, xmm7, xmm0 vpxorq xmm2{k5}, xmm7, [rbx] vpxorq xmm2{k5}, xmm7, [rbx]{1to2} vpxorq xmm2{k5}, xmm7, [rbx+r11*8+256] vpxorq xmm2{k5}, xmm7, [rbx+r11*8-256] vpxorq xmm2{k5}{z}, xmm7, xmm0 vpxorq xmm2{k5}{z}, xmm7, [rbx] vpxorq xmm2{k5}{z}, xmm7, [rbx]{1to2} vpxorq xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vpxorq xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vpxorq ymm16, ymm13, ymm15 vpxorq ymm16, ymm13, [rbx] vpxorq ymm16, ymm13, [rbx]{1to4} vpxorq ymm16, ymm13, [rbx+r11*8+256] vpxorq ymm16, ymm13, [rbx+r11*8-256] vpxorq ymm16{k5}, ymm13, ymm15 vpxorq ymm16{k5}, ymm13, [rbx] vpxorq ymm16{k5}, ymm13, [rbx]{1to4} vpxorq ymm16{k5}, ymm13, [rbx+r11*8+256] vpxorq ymm16{k5}, ymm13, [rbx+r11*8-256] vpxorq ymm16{k5}{z}, ymm13, ymm15 vpxorq ymm16{k5}{z}, ymm13, [rbx] vpxorq ymm16{k5}{z}, ymm13, [rbx]{1to4} vpxorq ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vpxorq ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vpxorq zmm24, zmm24, zmm31 vpxorq zmm24, zmm24, [rbx] vpxorq zmm24, zmm24, [rbx]{1to8} vpxorq zmm24, zmm24, [rbx+r11*8+256] vpxorq zmm24, zmm24, [rbx+r11*8-256] vpxorq zmm24{k5}, zmm24, zmm31 vpxorq zmm24{k5}, zmm24, [rbx] vpxorq zmm24{k5}, zmm24, [rbx]{1to8} vpxorq zmm24{k5}, zmm24, [rbx+r11*8+256] vpxorq zmm24{k5}, zmm24, [rbx+r11*8-256] vpxorq zmm24{k5}{z}, zmm24, zmm31 vpxorq zmm24{k5}{z}, zmm24, [rbx] vpxorq zmm24{k5}{z}, zmm24, [rbx]{1to8} vpxorq zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vpxorq zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vrcp14pd xmm2, xmm0 vrcp14pd xmm2, [rbx] vrcp14pd xmm2, [rbx]{1to2} vrcp14pd xmm2, [rbx+r11*8+256] vrcp14pd xmm2, [rbx+r11*8-256] vrcp14pd xmm2{k5}, xmm0 vrcp14pd xmm2{k5}, [rbx] vrcp14pd xmm2{k5}, [rbx]{1to2} vrcp14pd xmm2{k5}, [rbx+r11*8+256] vrcp14pd xmm2{k5}, [rbx+r11*8-256] vrcp14pd xmm2{k5}{z}, xmm0 vrcp14pd xmm2{k5}{z}, [rbx] vrcp14pd xmm2{k5}{z}, [rbx]{1to2} vrcp14pd xmm2{k5}{z}, [rbx+r11*8+256] vrcp14pd xmm2{k5}{z}, [rbx+r11*8-256] vrcp14pd ymm16, ymm15 vrcp14pd ymm16, [rbx] vrcp14pd ymm16, [rbx]{1to4} vrcp14pd ymm16, [rbx+r11*8+256] vrcp14pd ymm16, [rbx+r11*8-256] vrcp14pd ymm16{k5}, ymm15 vrcp14pd ymm16{k5}, [rbx] vrcp14pd ymm16{k5}, [rbx]{1to4} vrcp14pd ymm16{k5}, [rbx+r11*8+256] vrcp14pd ymm16{k5}, [rbx+r11*8-256] vrcp14pd ymm16{k5}{z}, ymm15 vrcp14pd ymm16{k5}{z}, [rbx] vrcp14pd ymm16{k5}{z}, [rbx]{1to4} vrcp14pd ymm16{k5}{z}, [rbx+r11*8+256] vrcp14pd ymm16{k5}{z}, [rbx+r11*8-256] vrcp14pd zmm24, zmm31 vrcp14pd zmm24, [rbx] vrcp14pd zmm24, [rbx]{1to8} vrcp14pd zmm24, [rbx+r11*8+256] vrcp14pd zmm24, [rbx+r11*8-256] vrcp14pd zmm24{k5}, zmm31 vrcp14pd zmm24{k5}, [rbx] vrcp14pd zmm24{k5}, [rbx]{1to8} vrcp14pd zmm24{k5}, [rbx+r11*8+256] vrcp14pd zmm24{k5}, [rbx+r11*8-256] vrcp14pd zmm24{k5}{z}, zmm31 vrcp14pd zmm24{k5}{z}, [rbx] vrcp14pd zmm24{k5}{z}, [rbx]{1to8} vrcp14pd zmm24{k5}{z}, [rbx+r11*8+256] vrcp14pd zmm24{k5}{z}, [rbx+r11*8-256] vrcp14ps xmm2, xmm0 vrcp14ps xmm2, [rbx] vrcp14ps xmm2, [rbx]{1to4} vrcp14ps xmm2, [rbx+r11*8+256] vrcp14ps xmm2, [rbx+r11*8-256] vrcp14ps xmm2{k5}, xmm0 vrcp14ps xmm2{k5}, [rbx] vrcp14ps xmm2{k5}, [rbx]{1to4} vrcp14ps xmm2{k5}, [rbx+r11*8+256] vrcp14ps xmm2{k5}, [rbx+r11*8-256] vrcp14ps xmm2{k5}{z}, xmm0 vrcp14ps xmm2{k5}{z}, [rbx] vrcp14ps xmm2{k5}{z}, [rbx]{1to4} vrcp14ps xmm2{k5}{z}, [rbx+r11*8+256] vrcp14ps xmm2{k5}{z}, [rbx+r11*8-256] vrcp14ps ymm16, ymm15 vrcp14ps ymm16, [rbx] vrcp14ps ymm16, [rbx]{1to8} vrcp14ps ymm16, [rbx+r11*8+256] vrcp14ps ymm16, [rbx+r11*8-256] vrcp14ps ymm16{k5}, ymm15 vrcp14ps ymm16{k5}, [rbx] vrcp14ps ymm16{k5}, [rbx]{1to8} vrcp14ps ymm16{k5}, [rbx+r11*8+256] vrcp14ps ymm16{k5}, [rbx+r11*8-256] vrcp14ps ymm16{k5}{z}, ymm15 vrcp14ps ymm16{k5}{z}, [rbx] vrcp14ps ymm16{k5}{z}, [rbx]{1to8} vrcp14ps ymm16{k5}{z}, [rbx+r11*8+256] vrcp14ps ymm16{k5}{z}, [rbx+r11*8-256] vrcp14ps zmm24, zmm31 vrcp14ps zmm24, [rbx] vrcp14ps zmm24, [rbx]{1to16} vrcp14ps zmm24, [rbx+r11*8+256] vrcp14ps zmm24, [rbx+r11*8-256] vrcp14ps zmm24{k5}, zmm31 vrcp14ps zmm24{k5}, [rbx] vrcp14ps zmm24{k5}, [rbx]{1to16} vrcp14ps zmm24{k5}, [rbx+r11*8+256] vrcp14ps zmm24{k5}, [rbx+r11*8-256] vrcp14ps zmm24{k5}{z}, zmm31 vrcp14ps zmm24{k5}{z}, [rbx] vrcp14ps zmm24{k5}{z}, [rbx]{1to16} vrcp14ps zmm24{k5}{z}, [rbx+r11*8+256] vrcp14ps zmm24{k5}{z}, [rbx+r11*8-256] vrcp14sd xmm2, xmm7, xmm0 vrcp14sd xmm2, xmm7, [rbx] vrcp14sd xmm2, xmm7, [rbx+r11*8+256] vrcp14sd xmm2, xmm7, [rbx+r11*8-256] vrcp14sd xmm2{k5}, xmm7, xmm0 vrcp14sd xmm2{k5}, xmm7, [rbx] vrcp14sd xmm2{k5}, xmm7, [rbx+r11*8+256] vrcp14sd xmm2{k5}, xmm7, [rbx+r11*8-256] vrcp14sd xmm2{k5}{z}, xmm7, xmm0 vrcp14sd xmm2{k5}{z}, xmm7, [rbx] vrcp14sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vrcp14sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vrcp14ss xmm2, xmm7, xmm0 vrcp14ss xmm2, xmm7, [rbx] vrcp14ss xmm2, xmm7, [rbx+r11*8+256] vrcp14ss xmm2, xmm7, [rbx+r11*8-256] vrcp14ss xmm2{k5}, xmm7, xmm0 vrcp14ss xmm2{k5}, xmm7, [rbx] vrcp14ss xmm2{k5}, xmm7, [rbx+r11*8+256] vrcp14ss xmm2{k5}, xmm7, [rbx+r11*8-256] vrcp14ss xmm2{k5}{z}, xmm7, xmm0 vrcp14ss xmm2{k5}{z}, xmm7, [rbx] vrcp14ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vrcp14ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vrndscalepd xmm2, xmm0, 10 vrndscalepd xmm2, [rbx], 10 vrndscalepd xmm2, [rbx]{1to2}, 10 vrndscalepd xmm2, [rbx+r11*8+256], 10 vrndscalepd xmm2, [rbx+r11*8-256], 10 vrndscalepd xmm2{k5}, xmm0, 10 vrndscalepd xmm2{k5}, [rbx], 10 vrndscalepd xmm2{k5}, [rbx]{1to2}, 10 vrndscalepd xmm2{k5}, [rbx+r11*8+256], 10 vrndscalepd xmm2{k5}, [rbx+r11*8-256], 10 vrndscalepd xmm2{k5}{z}, xmm0, 10 vrndscalepd xmm2{k5}{z}, [rbx], 10 vrndscalepd xmm2{k5}{z}, [rbx]{1to2}, 10 vrndscalepd xmm2{k5}{z}, [rbx+r11*8+256], 10 vrndscalepd xmm2{k5}{z}, [rbx+r11*8-256], 10 vrndscalepd ymm16, ymm15, 10 vrndscalepd ymm16, [rbx], 10 vrndscalepd ymm16, [rbx]{1to4}, 10 vrndscalepd ymm16, [rbx+r11*8+256], 10 vrndscalepd ymm16, [rbx+r11*8-256], 10 vrndscalepd ymm16{k5}, ymm15, 10 vrndscalepd ymm16{k5}, [rbx], 10 vrndscalepd ymm16{k5}, [rbx]{1to4}, 10 vrndscalepd ymm16{k5}, [rbx+r11*8+256], 10 vrndscalepd ymm16{k5}, [rbx+r11*8-256], 10 vrndscalepd ymm16{k5}{z}, ymm15, 10 vrndscalepd ymm16{k5}{z}, [rbx], 10 vrndscalepd ymm16{k5}{z}, [rbx]{1to4}, 10 vrndscalepd ymm16{k5}{z}, [rbx+r11*8+256], 10 vrndscalepd ymm16{k5}{z}, [rbx+r11*8-256], 10 vrndscalepd zmm24, zmm31, 10 vrndscalepd zmm24, [rbx], 10 vrndscalepd zmm24, [rbx]{1to8}, 10 vrndscalepd zmm24, [rbx+r11*8+256], 10 vrndscalepd zmm24, [rbx+r11*8-256], 10 vrndscalepd zmm24{k5}, zmm31, 10 vrndscalepd zmm24{k5}, [rbx], 10 vrndscalepd zmm24{k5}, [rbx]{1to8}, 10 vrndscalepd zmm24{k5}, [rbx+r11*8+256], 10 vrndscalepd zmm24{k5}, [rbx+r11*8-256], 10 vrndscalepd zmm24{k5}{z}, zmm31, 10 vrndscalepd zmm24{k5}{z}, [rbx], 10 vrndscalepd zmm24{k5}{z}, [rbx]{1to8}, 10 vrndscalepd zmm24{k5}{z}, [rbx+r11*8+256], 10 vrndscalepd zmm24{k5}{z}, [rbx+r11*8-256], 10 vrndscaleps xmm2, xmm0, 10 vrndscaleps xmm2, [rbx], 10 vrndscaleps xmm2, [rbx]{1to4}, 10 vrndscaleps xmm2, [rbx+r11*8+256], 10 vrndscaleps xmm2, [rbx+r11*8-256], 10 vrndscaleps xmm2{k5}, xmm0, 10 vrndscaleps xmm2{k5}, [rbx], 10 vrndscaleps xmm2{k5}, [rbx]{1to4}, 10 vrndscaleps xmm2{k5}, [rbx+r11*8+256], 10 vrndscaleps xmm2{k5}, [rbx+r11*8-256], 10 vrndscaleps xmm2{k5}{z}, xmm0, 10 vrndscaleps xmm2{k5}{z}, [rbx], 10 vrndscaleps xmm2{k5}{z}, [rbx]{1to4}, 10 vrndscaleps xmm2{k5}{z}, [rbx+r11*8+256], 10 vrndscaleps xmm2{k5}{z}, [rbx+r11*8-256], 10 vrndscaleps ymm16, ymm15, 10 vrndscaleps ymm16, [rbx], 10 vrndscaleps ymm16, [rbx]{1to8}, 10 vrndscaleps ymm16, [rbx+r11*8+256], 10 vrndscaleps ymm16, [rbx+r11*8-256], 10 vrndscaleps ymm16{k5}, ymm15, 10 vrndscaleps ymm16{k5}, [rbx], 10 vrndscaleps ymm16{k5}, [rbx]{1to8}, 10 vrndscaleps ymm16{k5}, [rbx+r11*8+256], 10 vrndscaleps ymm16{k5}, [rbx+r11*8-256], 10 vrndscaleps ymm16{k5}{z}, ymm15, 10 vrndscaleps ymm16{k5}{z}, [rbx], 10 vrndscaleps ymm16{k5}{z}, [rbx]{1to8}, 10 vrndscaleps ymm16{k5}{z}, [rbx+r11*8+256], 10 vrndscaleps ymm16{k5}{z}, [rbx+r11*8-256], 10 vrndscaleps zmm24, zmm31, 10 vrndscaleps zmm24, [rbx], 10 vrndscaleps zmm24, [rbx]{1to16}, 10 vrndscaleps zmm24, [rbx+r11*8+256], 10 vrndscaleps zmm24, [rbx+r11*8-256], 10 vrndscaleps zmm24{k5}, zmm31, 10 vrndscaleps zmm24{k5}, [rbx], 10 vrndscaleps zmm24{k5}, [rbx]{1to16}, 10 vrndscaleps zmm24{k5}, [rbx+r11*8+256], 10 vrndscaleps zmm24{k5}, [rbx+r11*8-256], 10 vrndscaleps zmm24{k5}{z}, zmm31, 10 vrndscaleps zmm24{k5}{z}, [rbx], 10 vrndscaleps zmm24{k5}{z}, [rbx]{1to16}, 10 vrndscaleps zmm24{k5}{z}, [rbx+r11*8+256], 10 vrndscaleps zmm24{k5}{z}, [rbx+r11*8-256], 10 vrndscalesd xmm2, xmm7, xmm0, 10 vrndscalesd xmm2, xmm7, [rbx], 10 vrndscalesd xmm2, xmm7, [rbx+r11*8+256], 10 vrndscalesd xmm2, xmm7, [rbx+r11*8-256], 10 vrndscalesd xmm2{k5}, xmm7, xmm0, 10 vrndscalesd xmm2{k5}, xmm7, [rbx], 10 vrndscalesd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vrndscalesd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vrndscalesd xmm2{k5}{z}, xmm7, xmm0, 10 vrndscalesd xmm2{k5}{z}, xmm7, [rbx], 10 vrndscalesd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vrndscalesd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vrndscaless xmm2, xmm7, xmm0, 10 vrndscaless xmm2, xmm7, [rbx], 10 vrndscaless xmm2, xmm7, [rbx+r11*8+256], 10 vrndscaless xmm2, xmm7, [rbx+r11*8-256], 10 vrndscaless xmm2{k5}, xmm7, xmm0, 10 vrndscaless xmm2{k5}, xmm7, [rbx], 10 vrndscaless xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vrndscaless xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vrndscaless xmm2{k5}{z}, xmm7, xmm0, 10 vrndscaless xmm2{k5}{z}, xmm7, [rbx], 10 vrndscaless xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vrndscaless xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vrsqrt14pd xmm2, xmm0 vrsqrt14pd xmm2, [rbx] vrsqrt14pd xmm2, [rbx]{1to2} vrsqrt14pd xmm2, [rbx+r11*8+256] vrsqrt14pd xmm2, [rbx+r11*8-256] vrsqrt14pd xmm2{k5}, xmm0 vrsqrt14pd xmm2{k5}, [rbx] vrsqrt14pd xmm2{k5}, [rbx]{1to2} vrsqrt14pd xmm2{k5}, [rbx+r11*8+256] vrsqrt14pd xmm2{k5}, [rbx+r11*8-256] vrsqrt14pd xmm2{k5}{z}, xmm0 vrsqrt14pd xmm2{k5}{z}, [rbx] vrsqrt14pd xmm2{k5}{z}, [rbx]{1to2} vrsqrt14pd xmm2{k5}{z}, [rbx+r11*8+256] vrsqrt14pd xmm2{k5}{z}, [rbx+r11*8-256] vrsqrt14pd ymm16, ymm15 vrsqrt14pd ymm16, [rbx] vrsqrt14pd ymm16, [rbx]{1to4} vrsqrt14pd ymm16, [rbx+r11*8+256] vrsqrt14pd ymm16, [rbx+r11*8-256] vrsqrt14pd ymm16{k5}, ymm15 vrsqrt14pd ymm16{k5}, [rbx] vrsqrt14pd ymm16{k5}, [rbx]{1to4} vrsqrt14pd ymm16{k5}, [rbx+r11*8+256] vrsqrt14pd ymm16{k5}, [rbx+r11*8-256] vrsqrt14pd ymm16{k5}{z}, ymm15 vrsqrt14pd ymm16{k5}{z}, [rbx] vrsqrt14pd ymm16{k5}{z}, [rbx]{1to4} vrsqrt14pd ymm16{k5}{z}, [rbx+r11*8+256] vrsqrt14pd ymm16{k5}{z}, [rbx+r11*8-256] vrsqrt14pd zmm24, zmm31 vrsqrt14pd zmm24, [rbx] vrsqrt14pd zmm24, [rbx]{1to8} vrsqrt14pd zmm24, [rbx+r11*8+256] vrsqrt14pd zmm24, [rbx+r11*8-256] vrsqrt14pd zmm24{k5}, zmm31 vrsqrt14pd zmm24{k5}, [rbx] vrsqrt14pd zmm24{k5}, [rbx]{1to8} vrsqrt14pd zmm24{k5}, [rbx+r11*8+256] vrsqrt14pd zmm24{k5}, [rbx+r11*8-256] vrsqrt14pd zmm24{k5}{z}, zmm31 vrsqrt14pd zmm24{k5}{z}, [rbx] vrsqrt14pd zmm24{k5}{z}, [rbx]{1to8} vrsqrt14pd zmm24{k5}{z}, [rbx+r11*8+256] vrsqrt14pd zmm24{k5}{z}, [rbx+r11*8-256] vrsqrt14ps xmm2, xmm0 vrsqrt14ps xmm2, [rbx] vrsqrt14ps xmm2, [rbx]{1to4} vrsqrt14ps xmm2, [rbx+r11*8+256] vrsqrt14ps xmm2, [rbx+r11*8-256] vrsqrt14ps xmm2{k5}, xmm0 vrsqrt14ps xmm2{k5}, [rbx] vrsqrt14ps xmm2{k5}, [rbx]{1to4} vrsqrt14ps xmm2{k5}, [rbx+r11*8+256] vrsqrt14ps xmm2{k5}, [rbx+r11*8-256] vrsqrt14ps xmm2{k5}{z}, xmm0 vrsqrt14ps xmm2{k5}{z}, [rbx] vrsqrt14ps xmm2{k5}{z}, [rbx]{1to4} vrsqrt14ps xmm2{k5}{z}, [rbx+r11*8+256] vrsqrt14ps xmm2{k5}{z}, [rbx+r11*8-256] vrsqrt14ps ymm16, ymm15 vrsqrt14ps ymm16, [rbx] vrsqrt14ps ymm16, [rbx]{1to8} vrsqrt14ps ymm16, [rbx+r11*8+256] vrsqrt14ps ymm16, [rbx+r11*8-256] vrsqrt14ps ymm16{k5}, ymm15 vrsqrt14ps ymm16{k5}, [rbx] vrsqrt14ps ymm16{k5}, [rbx]{1to8} vrsqrt14ps ymm16{k5}, [rbx+r11*8+256] vrsqrt14ps ymm16{k5}, [rbx+r11*8-256] vrsqrt14ps ymm16{k5}{z}, ymm15 vrsqrt14ps ymm16{k5}{z}, [rbx] vrsqrt14ps ymm16{k5}{z}, [rbx]{1to8} vrsqrt14ps ymm16{k5}{z}, [rbx+r11*8+256] vrsqrt14ps ymm16{k5}{z}, [rbx+r11*8-256] vrsqrt14ps zmm24, zmm31 vrsqrt14ps zmm24, [rbx] vrsqrt14ps zmm24, [rbx]{1to16} vrsqrt14ps zmm24, [rbx+r11*8+256] vrsqrt14ps zmm24, [rbx+r11*8-256] vrsqrt14ps zmm24{k5}, zmm31 vrsqrt14ps zmm24{k5}, [rbx] vrsqrt14ps zmm24{k5}, [rbx]{1to16} vrsqrt14ps zmm24{k5}, [rbx+r11*8+256] vrsqrt14ps zmm24{k5}, [rbx+r11*8-256] vrsqrt14ps zmm24{k5}{z}, zmm31 vrsqrt14ps zmm24{k5}{z}, [rbx] vrsqrt14ps zmm24{k5}{z}, [rbx]{1to16} vrsqrt14ps zmm24{k5}{z}, [rbx+r11*8+256] vrsqrt14ps zmm24{k5}{z}, [rbx+r11*8-256] vrsqrt14sd xmm2, xmm7, xmm0 vrsqrt14sd xmm2, xmm7, [rbx] vrsqrt14sd xmm2, xmm7, [rbx+r11*8+256] vrsqrt14sd xmm2, xmm7, [rbx+r11*8-256] vrsqrt14sd xmm2{k5}, xmm7, xmm0 vrsqrt14sd xmm2{k5}, xmm7, [rbx] vrsqrt14sd xmm2{k5}, xmm7, [rbx+r11*8+256] vrsqrt14sd xmm2{k5}, xmm7, [rbx+r11*8-256] vrsqrt14sd xmm2{k5}{z}, xmm7, xmm0 vrsqrt14sd xmm2{k5}{z}, xmm7, [rbx] vrsqrt14sd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vrsqrt14sd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vrsqrt14ss xmm2, xmm7, xmm0 vrsqrt14ss xmm2, xmm7, [rbx] vrsqrt14ss xmm2, xmm7, [rbx+r11*8+256] vrsqrt14ss xmm2, xmm7, [rbx+r11*8-256] vrsqrt14ss xmm2{k5}, xmm7, xmm0 vrsqrt14ss xmm2{k5}, xmm7, [rbx] vrsqrt14ss xmm2{k5}, xmm7, [rbx+r11*8+256] vrsqrt14ss xmm2{k5}, xmm7, [rbx+r11*8-256] vrsqrt14ss xmm2{k5}{z}, xmm7, xmm0 vrsqrt14ss xmm2{k5}{z}, xmm7, [rbx] vrsqrt14ss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vrsqrt14ss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vscalefpd xmm2, xmm7, xmm0 vscalefpd xmm2, xmm7, [rbx] vscalefpd xmm2, xmm7, [rbx]{1to2} vscalefpd xmm2, xmm7, [rbx+r11*8+256] vscalefpd xmm2, xmm7, [rbx+r11*8-256] vscalefpd xmm2{k5}, xmm7, xmm0 vscalefpd xmm2{k5}, xmm7, [rbx] vscalefpd xmm2{k5}, xmm7, [rbx]{1to2} vscalefpd xmm2{k5}, xmm7, [rbx+r11*8+256] vscalefpd xmm2{k5}, xmm7, [rbx+r11*8-256] vscalefpd xmm2{k5}{z}, xmm7, xmm0 vscalefpd xmm2{k5}{z}, xmm7, [rbx] vscalefpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vscalefpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vscalefpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vscalefpd ymm16, ymm13, ymm15 vscalefpd ymm16, ymm13, [rbx] vscalefpd ymm16, ymm13, [rbx]{1to4} vscalefpd ymm16, ymm13, [rbx+r11*8+256] vscalefpd ymm16, ymm13, [rbx+r11*8-256] vscalefpd ymm16{k5}, ymm13, ymm15 vscalefpd ymm16{k5}, ymm13, [rbx] vscalefpd ymm16{k5}, ymm13, [rbx]{1to4} vscalefpd ymm16{k5}, ymm13, [rbx+r11*8+256] vscalefpd ymm16{k5}, ymm13, [rbx+r11*8-256] vscalefpd ymm16{k5}{z}, ymm13, ymm15 vscalefpd ymm16{k5}{z}, ymm13, [rbx] vscalefpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vscalefpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vscalefpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vscalefpd zmm24, zmm24, zmm31 vscalefpd zmm24, zmm24, zmm31, {rd-sae} vscalefpd zmm24, zmm24, [rbx] vscalefpd zmm24, zmm24, [rbx]{1to8} vscalefpd zmm24, zmm24, [rbx+r11*8+256] vscalefpd zmm24, zmm24, [rbx+r11*8-256] vscalefpd zmm24{k5}, zmm24, zmm31 vscalefpd zmm24{k5}, zmm24, zmm31, {rd-sae} vscalefpd zmm24{k5}, zmm24, [rbx] vscalefpd zmm24{k5}, zmm24, [rbx]{1to8} vscalefpd zmm24{k5}, zmm24, [rbx+r11*8+256] vscalefpd zmm24{k5}, zmm24, [rbx+r11*8-256] vscalefpd zmm24{k5}{z}, zmm24, zmm31 vscalefpd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vscalefpd zmm24{k5}{z}, zmm24, [rbx] vscalefpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vscalefpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vscalefpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vscalefps xmm2, xmm7, xmm0 vscalefps xmm2, xmm7, [rbx] vscalefps xmm2, xmm7, [rbx]{1to4} vscalefps xmm2, xmm7, [rbx+r11*8+256] vscalefps xmm2, xmm7, [rbx+r11*8-256] vscalefps xmm2{k5}, xmm7, xmm0 vscalefps xmm2{k5}, xmm7, [rbx] vscalefps xmm2{k5}, xmm7, [rbx]{1to4} vscalefps xmm2{k5}, xmm7, [rbx+r11*8+256] vscalefps xmm2{k5}, xmm7, [rbx+r11*8-256] vscalefps xmm2{k5}{z}, xmm7, xmm0 vscalefps xmm2{k5}{z}, xmm7, [rbx] vscalefps xmm2{k5}{z}, xmm7, [rbx]{1to4} vscalefps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vscalefps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vscalefps ymm16, ymm13, ymm15 vscalefps ymm16, ymm13, [rbx] vscalefps ymm16, ymm13, [rbx]{1to8} vscalefps ymm16, ymm13, [rbx+r11*8+256] vscalefps ymm16, ymm13, [rbx+r11*8-256] vscalefps ymm16{k5}, ymm13, ymm15 vscalefps ymm16{k5}, ymm13, [rbx] vscalefps ymm16{k5}, ymm13, [rbx]{1to8} vscalefps ymm16{k5}, ymm13, [rbx+r11*8+256] vscalefps ymm16{k5}, ymm13, [rbx+r11*8-256] vscalefps ymm16{k5}{z}, ymm13, ymm15 vscalefps ymm16{k5}{z}, ymm13, [rbx] vscalefps ymm16{k5}{z}, ymm13, [rbx]{1to8} vscalefps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vscalefps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vscalefps zmm24, zmm24, zmm31 vscalefps zmm24, zmm24, zmm31, {rd-sae} vscalefps zmm24, zmm24, [rbx] vscalefps zmm24, zmm24, [rbx]{1to16} vscalefps zmm24, zmm24, [rbx+r11*8+256] vscalefps zmm24, zmm24, [rbx+r11*8-256] vscalefps zmm24{k5}, zmm24, zmm31 vscalefps zmm24{k5}, zmm24, zmm31, {rd-sae} vscalefps zmm24{k5}, zmm24, [rbx] vscalefps zmm24{k5}, zmm24, [rbx]{1to16} vscalefps zmm24{k5}, zmm24, [rbx+r11*8+256] vscalefps zmm24{k5}, zmm24, [rbx+r11*8-256] vscalefps zmm24{k5}{z}, zmm24, zmm31 vscalefps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vscalefps zmm24{k5}{z}, zmm24, [rbx] vscalefps zmm24{k5}{z}, zmm24, [rbx]{1to16} vscalefps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vscalefps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vscalefsd xmm2, xmm7, xmm0 vscalefsd xmm2, xmm7, xmm0, {rd-sae} vscalefsd xmm2, xmm7, [rbx] vscalefsd xmm2, xmm7, [rbx+r11*8+256] vscalefsd xmm2, xmm7, [rbx+r11*8-256] vscalefsd xmm2{k5}, xmm7, xmm0 vscalefsd xmm2{k5}, xmm7, xmm0, {rd-sae} vscalefsd xmm2{k5}, xmm7, [rbx] vscalefsd xmm2{k5}, xmm7, [rbx+r11*8+256] vscalefsd xmm2{k5}, xmm7, [rbx+r11*8-256] vscalefsd xmm2{k5}{z}, xmm7, xmm0 vscalefsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vscalefsd xmm2{k5}{z}, xmm7, [rbx] vscalefsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vscalefsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vscalefss xmm2, xmm7, xmm0 vscalefss xmm2, xmm7, xmm0, {rd-sae} vscalefss xmm2, xmm7, [rbx] vscalefss xmm2, xmm7, [rbx+r11*8+256] vscalefss xmm2, xmm7, [rbx+r11*8-256] vscalefss xmm2{k5}, xmm7, xmm0 vscalefss xmm2{k5}, xmm7, xmm0, {rd-sae} vscalefss xmm2{k5}, xmm7, [rbx] vscalefss xmm2{k5}, xmm7, [rbx+r11*8+256] vscalefss xmm2{k5}, xmm7, [rbx+r11*8-256] vscalefss xmm2{k5}{z}, xmm7, xmm0 vscalefss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vscalefss xmm2{k5}{z}, xmm7, [rbx] vscalefss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vscalefss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vshuff32x4 ymm16, ymm13, ymm15, 10 vshuff32x4 ymm16, ymm13, [rbx], 10 vshuff32x4 ymm16, ymm13, [rbx]{1to8}, 10 vshuff32x4 ymm16, ymm13, [rbx+r11*8+256], 10 vshuff32x4 ymm16, ymm13, [rbx+r11*8-256], 10 vshuff32x4 ymm16{k5}, ymm13, ymm15, 10 vshuff32x4 ymm16{k5}, ymm13, [rbx], 10 vshuff32x4 ymm16{k5}, ymm13, [rbx]{1to8}, 10 vshuff32x4 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshuff32x4 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshuff32x4 ymm16{k5}{z}, ymm13, ymm15, 10 vshuff32x4 ymm16{k5}{z}, ymm13, [rbx], 10 vshuff32x4 ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 vshuff32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshuff32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshuff32x4 zmm24, zmm24, zmm31, 10 vshuff32x4 zmm24, zmm24, [rbx], 10 vshuff32x4 zmm24, zmm24, [rbx]{1to16}, 10 vshuff32x4 zmm24, zmm24, [rbx+r11*8+256], 10 vshuff32x4 zmm24, zmm24, [rbx+r11*8-256], 10 vshuff32x4 zmm24{k5}, zmm24, zmm31, 10 vshuff32x4 zmm24{k5}, zmm24, [rbx], 10 vshuff32x4 zmm24{k5}, zmm24, [rbx]{1to16}, 10 vshuff32x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshuff32x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshuff32x4 zmm24{k5}{z}, zmm24, zmm31, 10 vshuff32x4 zmm24{k5}{z}, zmm24, [rbx], 10 vshuff32x4 zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 vshuff32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshuff32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vshuff64x2 ymm16, ymm13, ymm15, 10 vshuff64x2 ymm16, ymm13, [rbx], 10 vshuff64x2 ymm16, ymm13, [rbx]{1to4}, 10 vshuff64x2 ymm16, ymm13, [rbx+r11*8+256], 10 vshuff64x2 ymm16, ymm13, [rbx+r11*8-256], 10 vshuff64x2 ymm16{k5}, ymm13, ymm15, 10 vshuff64x2 ymm16{k5}, ymm13, [rbx], 10 vshuff64x2 ymm16{k5}, ymm13, [rbx]{1to4}, 10 vshuff64x2 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshuff64x2 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshuff64x2 ymm16{k5}{z}, ymm13, ymm15, 10 vshuff64x2 ymm16{k5}{z}, ymm13, [rbx], 10 vshuff64x2 ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 vshuff64x2 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshuff64x2 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshuff64x2 zmm24, zmm24, zmm31, 10 vshuff64x2 zmm24, zmm24, [rbx], 10 vshuff64x2 zmm24, zmm24, [rbx]{1to8}, 10 vshuff64x2 zmm24, zmm24, [rbx+r11*8+256], 10 vshuff64x2 zmm24, zmm24, [rbx+r11*8-256], 10 vshuff64x2 zmm24{k5}, zmm24, zmm31, 10 vshuff64x2 zmm24{k5}, zmm24, [rbx], 10 vshuff64x2 zmm24{k5}, zmm24, [rbx]{1to8}, 10 vshuff64x2 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshuff64x2 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshuff64x2 zmm24{k5}{z}, zmm24, zmm31, 10 vshuff64x2 zmm24{k5}{z}, zmm24, [rbx], 10 vshuff64x2 zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 vshuff64x2 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshuff64x2 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vshufi32x4 ymm16, ymm13, ymm15, 10 vshufi32x4 ymm16, ymm13, [rbx], 10 vshufi32x4 ymm16, ymm13, [rbx]{1to8}, 10 vshufi32x4 ymm16, ymm13, [rbx+r11*8+256], 10 vshufi32x4 ymm16, ymm13, [rbx+r11*8-256], 10 vshufi32x4 ymm16{k5}, ymm13, ymm15, 10 vshufi32x4 ymm16{k5}, ymm13, [rbx], 10 vshufi32x4 ymm16{k5}, ymm13, [rbx]{1to8}, 10 vshufi32x4 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshufi32x4 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshufi32x4 ymm16{k5}{z}, ymm13, ymm15, 10 vshufi32x4 ymm16{k5}{z}, ymm13, [rbx], 10 vshufi32x4 ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 vshufi32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshufi32x4 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshufi32x4 zmm24, zmm24, zmm31, 10 vshufi32x4 zmm24, zmm24, [rbx], 10 vshufi32x4 zmm24, zmm24, [rbx]{1to16}, 10 vshufi32x4 zmm24, zmm24, [rbx+r11*8+256], 10 vshufi32x4 zmm24, zmm24, [rbx+r11*8-256], 10 vshufi32x4 zmm24{k5}, zmm24, zmm31, 10 vshufi32x4 zmm24{k5}, zmm24, [rbx], 10 vshufi32x4 zmm24{k5}, zmm24, [rbx]{1to16}, 10 vshufi32x4 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshufi32x4 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshufi32x4 zmm24{k5}{z}, zmm24, zmm31, 10 vshufi32x4 zmm24{k5}{z}, zmm24, [rbx], 10 vshufi32x4 zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 vshufi32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshufi32x4 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vshufi64x2 ymm16, ymm13, ymm15, 10 vshufi64x2 ymm16, ymm13, [rbx], 10 vshufi64x2 ymm16, ymm13, [rbx]{1to4}, 10 vshufi64x2 ymm16, ymm13, [rbx+r11*8+256], 10 vshufi64x2 ymm16, ymm13, [rbx+r11*8-256], 10 vshufi64x2 ymm16{k5}, ymm13, ymm15, 10 vshufi64x2 ymm16{k5}, ymm13, [rbx], 10 vshufi64x2 ymm16{k5}, ymm13, [rbx]{1to4}, 10 vshufi64x2 ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshufi64x2 ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshufi64x2 ymm16{k5}{z}, ymm13, ymm15, 10 vshufi64x2 ymm16{k5}{z}, ymm13, [rbx], 10 vshufi64x2 ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 vshufi64x2 ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshufi64x2 ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshufi64x2 zmm24, zmm24, zmm31, 10 vshufi64x2 zmm24, zmm24, [rbx], 10 vshufi64x2 zmm24, zmm24, [rbx]{1to8}, 10 vshufi64x2 zmm24, zmm24, [rbx+r11*8+256], 10 vshufi64x2 zmm24, zmm24, [rbx+r11*8-256], 10 vshufi64x2 zmm24{k5}, zmm24, zmm31, 10 vshufi64x2 zmm24{k5}, zmm24, [rbx], 10 vshufi64x2 zmm24{k5}, zmm24, [rbx]{1to8}, 10 vshufi64x2 zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshufi64x2 zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshufi64x2 zmm24{k5}{z}, zmm24, zmm31, 10 vshufi64x2 zmm24{k5}{z}, zmm24, [rbx], 10 vshufi64x2 zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 vshufi64x2 zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshufi64x2 zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vshufpd xmm2, xmm7, xmm0, 10 vshufpd xmm2, xmm7, [rbx], 10 vshufpd xmm2, xmm7, [rbx]{1to2}, 10 vshufpd xmm2, xmm7, [rbx+r11*8+256], 10 vshufpd xmm2, xmm7, [rbx+r11*8-256], 10 vshufpd xmm2{k5}, xmm7, xmm0, 10 vshufpd xmm2{k5}, xmm7, [rbx], 10 vshufpd xmm2{k5}, xmm7, [rbx]{1to2}, 10 vshufpd xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vshufpd xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vshufpd xmm2{k5}{z}, xmm7, xmm0, 10 vshufpd xmm2{k5}{z}, xmm7, [rbx], 10 vshufpd xmm2{k5}{z}, xmm7, [rbx]{1to2}, 10 vshufpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vshufpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vshufpd ymm16, ymm13, ymm15, 10 vshufpd ymm16, ymm13, [rbx], 10 vshufpd ymm16, ymm13, [rbx]{1to4}, 10 vshufpd ymm16, ymm13, [rbx+r11*8+256], 10 vshufpd ymm16, ymm13, [rbx+r11*8-256], 10 vshufpd ymm16{k5}, ymm13, ymm15, 10 vshufpd ymm16{k5}, ymm13, [rbx], 10 vshufpd ymm16{k5}, ymm13, [rbx]{1to4}, 10 vshufpd ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshufpd ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshufpd ymm16{k5}{z}, ymm13, ymm15, 10 vshufpd ymm16{k5}{z}, ymm13, [rbx], 10 vshufpd ymm16{k5}{z}, ymm13, [rbx]{1to4}, 10 vshufpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshufpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshufpd zmm24, zmm24, zmm31, 10 vshufpd zmm24, zmm24, [rbx], 10 vshufpd zmm24, zmm24, [rbx]{1to8}, 10 vshufpd zmm24, zmm24, [rbx+r11*8+256], 10 vshufpd zmm24, zmm24, [rbx+r11*8-256], 10 vshufpd zmm24{k5}, zmm24, zmm31, 10 vshufpd zmm24{k5}, zmm24, [rbx], 10 vshufpd zmm24{k5}, zmm24, [rbx]{1to8}, 10 vshufpd zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshufpd zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshufpd zmm24{k5}{z}, zmm24, zmm31, 10 vshufpd zmm24{k5}{z}, zmm24, [rbx], 10 vshufpd zmm24{k5}{z}, zmm24, [rbx]{1to8}, 10 vshufpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshufpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vshufps xmm2, xmm7, xmm0, 10 vshufps xmm2, xmm7, [rbx], 10 vshufps xmm2, xmm7, [rbx]{1to4}, 10 vshufps xmm2, xmm7, [rbx+r11*8+256], 10 vshufps xmm2, xmm7, [rbx+r11*8-256], 10 vshufps xmm2{k5}, xmm7, xmm0, 10 vshufps xmm2{k5}, xmm7, [rbx], 10 vshufps xmm2{k5}, xmm7, [rbx]{1to4}, 10 vshufps xmm2{k5}, xmm7, [rbx+r11*8+256], 10 vshufps xmm2{k5}, xmm7, [rbx+r11*8-256], 10 vshufps xmm2{k5}{z}, xmm7, xmm0, 10 vshufps xmm2{k5}{z}, xmm7, [rbx], 10 vshufps xmm2{k5}{z}, xmm7, [rbx]{1to4}, 10 vshufps xmm2{k5}{z}, xmm7, [rbx+r11*8+256], 10 vshufps xmm2{k5}{z}, xmm7, [rbx+r11*8-256], 10 vshufps ymm16, ymm13, ymm15, 10 vshufps ymm16, ymm13, [rbx], 10 vshufps ymm16, ymm13, [rbx]{1to8}, 10 vshufps ymm16, ymm13, [rbx+r11*8+256], 10 vshufps ymm16, ymm13, [rbx+r11*8-256], 10 vshufps ymm16{k5}, ymm13, ymm15, 10 vshufps ymm16{k5}, ymm13, [rbx], 10 vshufps ymm16{k5}, ymm13, [rbx]{1to8}, 10 vshufps ymm16{k5}, ymm13, [rbx+r11*8+256], 10 vshufps ymm16{k5}, ymm13, [rbx+r11*8-256], 10 vshufps ymm16{k5}{z}, ymm13, ymm15, 10 vshufps ymm16{k5}{z}, ymm13, [rbx], 10 vshufps ymm16{k5}{z}, ymm13, [rbx]{1to8}, 10 vshufps ymm16{k5}{z}, ymm13, [rbx+r11*8+256], 10 vshufps ymm16{k5}{z}, ymm13, [rbx+r11*8-256], 10 vshufps zmm24, zmm24, zmm31, 10 vshufps zmm24, zmm24, [rbx], 10 vshufps zmm24, zmm24, [rbx]{1to16}, 10 vshufps zmm24, zmm24, [rbx+r11*8+256], 10 vshufps zmm24, zmm24, [rbx+r11*8-256], 10 vshufps zmm24{k5}, zmm24, zmm31, 10 vshufps zmm24{k5}, zmm24, [rbx], 10 vshufps zmm24{k5}, zmm24, [rbx]{1to16}, 10 vshufps zmm24{k5}, zmm24, [rbx+r11*8+256], 10 vshufps zmm24{k5}, zmm24, [rbx+r11*8-256], 10 vshufps zmm24{k5}{z}, zmm24, zmm31, 10 vshufps zmm24{k5}{z}, zmm24, [rbx], 10 vshufps zmm24{k5}{z}, zmm24, [rbx]{1to16}, 10 vshufps zmm24{k5}{z}, zmm24, [rbx+r11*8+256], 10 vshufps zmm24{k5}{z}, zmm24, [rbx+r11*8-256], 10 vsqrtpd xmm2, xmm0 vsqrtpd xmm2, [rbx] vsqrtpd xmm2, [rbx]{1to2} vsqrtpd xmm2, [rbx+r11*8+256] vsqrtpd xmm2, [rbx+r11*8-256] vsqrtpd xmm2{k5}, xmm0 vsqrtpd xmm2{k5}, [rbx] vsqrtpd xmm2{k5}, [rbx]{1to2} vsqrtpd xmm2{k5}, [rbx+r11*8+256] vsqrtpd xmm2{k5}, [rbx+r11*8-256] vsqrtpd xmm2{k5}{z}, xmm0 vsqrtpd xmm2{k5}{z}, [rbx] vsqrtpd xmm2{k5}{z}, [rbx]{1to2} vsqrtpd xmm2{k5}{z}, [rbx+r11*8+256] vsqrtpd xmm2{k5}{z}, [rbx+r11*8-256] vsqrtpd ymm16, ymm15 vsqrtpd ymm16, [rbx] vsqrtpd ymm16, [rbx]{1to4} vsqrtpd ymm16, [rbx+r11*8+256] vsqrtpd ymm16, [rbx+r11*8-256] vsqrtpd ymm16{k5}, ymm15 vsqrtpd ymm16{k5}, [rbx] vsqrtpd ymm16{k5}, [rbx]{1to4} vsqrtpd ymm16{k5}, [rbx+r11*8+256] vsqrtpd ymm16{k5}, [rbx+r11*8-256] vsqrtpd ymm16{k5}{z}, ymm15 vsqrtpd ymm16{k5}{z}, [rbx] vsqrtpd ymm16{k5}{z}, [rbx]{1to4} vsqrtpd ymm16{k5}{z}, [rbx+r11*8+256] vsqrtpd ymm16{k5}{z}, [rbx+r11*8-256] vsqrtpd zmm24, zmm31 vsqrtpd zmm24, zmm31, {rd-sae} vsqrtpd zmm24, [rbx] vsqrtpd zmm24, [rbx]{1to8} vsqrtpd zmm24, [rbx+r11*8+256] vsqrtpd zmm24, [rbx+r11*8-256] vsqrtpd zmm24{k5}, zmm31 vsqrtpd zmm24{k5}, zmm31, {rd-sae} vsqrtpd zmm24{k5}, [rbx] vsqrtpd zmm24{k5}, [rbx]{1to8} vsqrtpd zmm24{k5}, [rbx+r11*8+256] vsqrtpd zmm24{k5}, [rbx+r11*8-256] vsqrtpd zmm24{k5}{z}, zmm31 vsqrtpd zmm24{k5}{z}, zmm31, {rd-sae} vsqrtpd zmm24{k5}{z}, [rbx] vsqrtpd zmm24{k5}{z}, [rbx]{1to8} vsqrtpd zmm24{k5}{z}, [rbx+r11*8+256] vsqrtpd zmm24{k5}{z}, [rbx+r11*8-256] vsqrtps xmm2, xmm0 vsqrtps xmm2, [rbx] vsqrtps xmm2, [rbx]{1to4} vsqrtps xmm2, [rbx+r11*8+256] vsqrtps xmm2, [rbx+r11*8-256] vsqrtps xmm2{k5}, xmm0 vsqrtps xmm2{k5}, [rbx] vsqrtps xmm2{k5}, [rbx]{1to4} vsqrtps xmm2{k5}, [rbx+r11*8+256] vsqrtps xmm2{k5}, [rbx+r11*8-256] vsqrtps xmm2{k5}{z}, xmm0 vsqrtps xmm2{k5}{z}, [rbx] vsqrtps xmm2{k5}{z}, [rbx]{1to4} vsqrtps xmm2{k5}{z}, [rbx+r11*8+256] vsqrtps xmm2{k5}{z}, [rbx+r11*8-256] vsqrtps ymm16, ymm15 vsqrtps ymm16, [rbx] vsqrtps ymm16, [rbx]{1to8} vsqrtps ymm16, [rbx+r11*8+256] vsqrtps ymm16, [rbx+r11*8-256] vsqrtps ymm16{k5}, ymm15 vsqrtps ymm16{k5}, [rbx] vsqrtps ymm16{k5}, [rbx]{1to8} vsqrtps ymm16{k5}, [rbx+r11*8+256] vsqrtps ymm16{k5}, [rbx+r11*8-256] vsqrtps ymm16{k5}{z}, ymm15 vsqrtps ymm16{k5}{z}, [rbx] vsqrtps ymm16{k5}{z}, [rbx]{1to8} vsqrtps ymm16{k5}{z}, [rbx+r11*8+256] vsqrtps ymm16{k5}{z}, [rbx+r11*8-256] vsqrtps zmm24, zmm31 vsqrtps zmm24, zmm31, {rd-sae} vsqrtps zmm24, [rbx] vsqrtps zmm24, [rbx]{1to16} vsqrtps zmm24, [rbx+r11*8+256] vsqrtps zmm24, [rbx+r11*8-256] vsqrtps zmm24{k5}, zmm31 vsqrtps zmm24{k5}, zmm31, {rd-sae} vsqrtps zmm24{k5}, [rbx] vsqrtps zmm24{k5}, [rbx]{1to16} vsqrtps zmm24{k5}, [rbx+r11*8+256] vsqrtps zmm24{k5}, [rbx+r11*8-256] vsqrtps zmm24{k5}{z}, zmm31 vsqrtps zmm24{k5}{z}, zmm31, {rd-sae} vsqrtps zmm24{k5}{z}, [rbx] vsqrtps zmm24{k5}{z}, [rbx]{1to16} vsqrtps zmm24{k5}{z}, [rbx+r11*8+256] vsqrtps zmm24{k5}{z}, [rbx+r11*8-256] vsqrtsd xmm2, xmm7, xmm0 vsqrtsd xmm2, xmm7, xmm0, {rd-sae} vsqrtsd xmm2, xmm7, [rbx] vsqrtsd xmm2, xmm7, [rbx+r11*8+256] vsqrtsd xmm2, xmm7, [rbx+r11*8-256] vsqrtsd xmm2{k5}, xmm7, xmm0 vsqrtsd xmm2{k5}, xmm7, xmm0, {rd-sae} vsqrtsd xmm2{k5}, xmm7, [rbx] vsqrtsd xmm2{k5}, xmm7, [rbx+r11*8+256] vsqrtsd xmm2{k5}, xmm7, [rbx+r11*8-256] vsqrtsd xmm2{k5}{z}, xmm7, xmm0 vsqrtsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vsqrtsd xmm2{k5}{z}, xmm7, [rbx] vsqrtsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsqrtsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vsqrtss xmm2, xmm7, xmm0 vsqrtss xmm2, xmm7, xmm0, {rd-sae} vsqrtss xmm2, xmm7, [rbx] vsqrtss xmm2, xmm7, [rbx+r11*8+256] vsqrtss xmm2, xmm7, [rbx+r11*8-256] vsqrtss xmm2{k5}, xmm7, xmm0 vsqrtss xmm2{k5}, xmm7, xmm0, {rd-sae} vsqrtss xmm2{k5}, xmm7, [rbx] vsqrtss xmm2{k5}, xmm7, [rbx+r11*8+256] vsqrtss xmm2{k5}, xmm7, [rbx+r11*8-256] vsqrtss xmm2{k5}{z}, xmm7, xmm0 vsqrtss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vsqrtss xmm2{k5}{z}, xmm7, [rbx] vsqrtss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsqrtss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vsubpd xmm2, xmm7, xmm0 vsubpd xmm2, xmm7, [rbx] vsubpd xmm2, xmm7, [rbx]{1to2} vsubpd xmm2, xmm7, [rbx+r11*8+256] vsubpd xmm2, xmm7, [rbx+r11*8-256] vsubpd xmm2{k5}, xmm7, xmm0 vsubpd xmm2{k5}, xmm7, [rbx] vsubpd xmm2{k5}, xmm7, [rbx]{1to2} vsubpd xmm2{k5}, xmm7, [rbx+r11*8+256] vsubpd xmm2{k5}, xmm7, [rbx+r11*8-256] vsubpd xmm2{k5}{z}, xmm7, xmm0 vsubpd xmm2{k5}{z}, xmm7, [rbx] vsubpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vsubpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsubpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vsubpd ymm16, ymm13, ymm15 vsubpd ymm16, ymm13, [rbx] vsubpd ymm16, ymm13, [rbx]{1to4} vsubpd ymm16, ymm13, [rbx+r11*8+256] vsubpd ymm16, ymm13, [rbx+r11*8-256] vsubpd ymm16{k5}, ymm13, ymm15 vsubpd ymm16{k5}, ymm13, [rbx] vsubpd ymm16{k5}, ymm13, [rbx]{1to4} vsubpd ymm16{k5}, ymm13, [rbx+r11*8+256] vsubpd ymm16{k5}, ymm13, [rbx+r11*8-256] vsubpd ymm16{k5}{z}, ymm13, ymm15 vsubpd ymm16{k5}{z}, ymm13, [rbx] vsubpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vsubpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vsubpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vsubpd zmm24, zmm24, zmm31 vsubpd zmm24, zmm24, zmm31, {rd-sae} vsubpd zmm24, zmm24, [rbx] vsubpd zmm24, zmm24, [rbx]{1to8} vsubpd zmm24, zmm24, [rbx+r11*8+256] vsubpd zmm24, zmm24, [rbx+r11*8-256] vsubpd zmm24{k5}, zmm24, zmm31 vsubpd zmm24{k5}, zmm24, zmm31, {rd-sae} vsubpd zmm24{k5}, zmm24, [rbx] vsubpd zmm24{k5}, zmm24, [rbx]{1to8} vsubpd zmm24{k5}, zmm24, [rbx+r11*8+256] vsubpd zmm24{k5}, zmm24, [rbx+r11*8-256] vsubpd zmm24{k5}{z}, zmm24, zmm31 vsubpd zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vsubpd zmm24{k5}{z}, zmm24, [rbx] vsubpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vsubpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vsubpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vsubps xmm2, xmm7, xmm0 vsubps xmm2, xmm7, [rbx] vsubps xmm2, xmm7, [rbx]{1to4} vsubps xmm2, xmm7, [rbx+r11*8+256] vsubps xmm2, xmm7, [rbx+r11*8-256] vsubps xmm2{k5}, xmm7, xmm0 vsubps xmm2{k5}, xmm7, [rbx] vsubps xmm2{k5}, xmm7, [rbx]{1to4} vsubps xmm2{k5}, xmm7, [rbx+r11*8+256] vsubps xmm2{k5}, xmm7, [rbx+r11*8-256] vsubps xmm2{k5}{z}, xmm7, xmm0 vsubps xmm2{k5}{z}, xmm7, [rbx] vsubps xmm2{k5}{z}, xmm7, [rbx]{1to4} vsubps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsubps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vsubps ymm16, ymm13, ymm15 vsubps ymm16, ymm13, [rbx] vsubps ymm16, ymm13, [rbx]{1to8} vsubps ymm16, ymm13, [rbx+r11*8+256] vsubps ymm16, ymm13, [rbx+r11*8-256] vsubps ymm16{k5}, ymm13, ymm15 vsubps ymm16{k5}, ymm13, [rbx] vsubps ymm16{k5}, ymm13, [rbx]{1to8} vsubps ymm16{k5}, ymm13, [rbx+r11*8+256] vsubps ymm16{k5}, ymm13, [rbx+r11*8-256] vsubps ymm16{k5}{z}, ymm13, ymm15 vsubps ymm16{k5}{z}, ymm13, [rbx] vsubps ymm16{k5}{z}, ymm13, [rbx]{1to8} vsubps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vsubps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vsubps zmm24, zmm24, zmm31 vsubps zmm24, zmm24, zmm31, {rd-sae} vsubps zmm24, zmm24, [rbx] vsubps zmm24, zmm24, [rbx]{1to16} vsubps zmm24, zmm24, [rbx+r11*8+256] vsubps zmm24, zmm24, [rbx+r11*8-256] vsubps zmm24{k5}, zmm24, zmm31 vsubps zmm24{k5}, zmm24, zmm31, {rd-sae} vsubps zmm24{k5}, zmm24, [rbx] vsubps zmm24{k5}, zmm24, [rbx]{1to16} vsubps zmm24{k5}, zmm24, [rbx+r11*8+256] vsubps zmm24{k5}, zmm24, [rbx+r11*8-256] vsubps zmm24{k5}{z}, zmm24, zmm31 vsubps zmm24{k5}{z}, zmm24, zmm31, {rd-sae} vsubps zmm24{k5}{z}, zmm24, [rbx] vsubps zmm24{k5}{z}, zmm24, [rbx]{1to16} vsubps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vsubps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vsubsd xmm2, xmm7, xmm0 vsubsd xmm2, xmm7, xmm0, {rd-sae} vsubsd xmm2, xmm7, [rbx] vsubsd xmm2, xmm7, [rbx+r11*8+256] vsubsd xmm2, xmm7, [rbx+r11*8-256] vsubsd xmm2{k5}, xmm7, xmm0 vsubsd xmm2{k5}, xmm7, xmm0, {rd-sae} vsubsd xmm2{k5}, xmm7, [rbx] vsubsd xmm2{k5}, xmm7, [rbx+r11*8+256] vsubsd xmm2{k5}, xmm7, [rbx+r11*8-256] vsubsd xmm2{k5}{z}, xmm7, xmm0 vsubsd xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vsubsd xmm2{k5}{z}, xmm7, [rbx] vsubsd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsubsd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vsubss xmm2, xmm7, xmm0 vsubss xmm2, xmm7, xmm0, {rd-sae} vsubss xmm2, xmm7, [rbx] vsubss xmm2, xmm7, [rbx+r11*8+256] vsubss xmm2, xmm7, [rbx+r11*8-256] vsubss xmm2{k5}, xmm7, xmm0 vsubss xmm2{k5}, xmm7, xmm0, {rd-sae} vsubss xmm2{k5}, xmm7, [rbx] vsubss xmm2{k5}, xmm7, [rbx+r11*8+256] vsubss xmm2{k5}, xmm7, [rbx+r11*8-256] vsubss xmm2{k5}{z}, xmm7, xmm0 vsubss xmm2{k5}{z}, xmm7, xmm0, {rd-sae} vsubss xmm2{k5}{z}, xmm7, [rbx] vsubss xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vsubss xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vucomisd xmm2, xmm0 vucomisd xmm2, xmm0, {sae} vucomisd xmm2, [rbx] vucomisd xmm2, [rbx+r11*8+256] vucomisd xmm2, [rbx+r11*8-256] vucomiss xmm2, xmm0 vucomiss xmm2, xmm0, {sae} vucomiss xmm2, [rbx] vucomiss xmm2, [rbx+r11*8+256] vucomiss xmm2, [rbx+r11*8-256] vunpckhpd xmm2, xmm7, xmm0 vunpckhpd xmm2, xmm7, [rbx] vunpckhpd xmm2, xmm7, [rbx]{1to2} vunpckhpd xmm2, xmm7, [rbx+r11*8+256] vunpckhpd xmm2, xmm7, [rbx+r11*8-256] vunpckhpd xmm2{k5}, xmm7, xmm0 vunpckhpd xmm2{k5}, xmm7, [rbx] vunpckhpd xmm2{k5}, xmm7, [rbx]{1to2} vunpckhpd xmm2{k5}, xmm7, [rbx+r11*8+256] vunpckhpd xmm2{k5}, xmm7, [rbx+r11*8-256] vunpckhpd xmm2{k5}{z}, xmm7, xmm0 vunpckhpd xmm2{k5}{z}, xmm7, [rbx] vunpckhpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vunpckhpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vunpckhpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vunpckhpd ymm16, ymm13, ymm15 vunpckhpd ymm16, ymm13, [rbx] vunpckhpd ymm16, ymm13, [rbx]{1to4} vunpckhpd ymm16, ymm13, [rbx+r11*8+256] vunpckhpd ymm16, ymm13, [rbx+r11*8-256] vunpckhpd ymm16{k5}, ymm13, ymm15 vunpckhpd ymm16{k5}, ymm13, [rbx] vunpckhpd ymm16{k5}, ymm13, [rbx]{1to4} vunpckhpd ymm16{k5}, ymm13, [rbx+r11*8+256] vunpckhpd ymm16{k5}, ymm13, [rbx+r11*8-256] vunpckhpd ymm16{k5}{z}, ymm13, ymm15 vunpckhpd ymm16{k5}{z}, ymm13, [rbx] vunpckhpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vunpckhpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vunpckhpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vunpckhpd zmm24, zmm24, zmm31 vunpckhpd zmm24, zmm24, [rbx] vunpckhpd zmm24, zmm24, [rbx]{1to8} vunpckhpd zmm24, zmm24, [rbx+r11*8+256] vunpckhpd zmm24, zmm24, [rbx+r11*8-256] vunpckhpd zmm24{k5}, zmm24, zmm31 vunpckhpd zmm24{k5}, zmm24, [rbx] vunpckhpd zmm24{k5}, zmm24, [rbx]{1to8} vunpckhpd zmm24{k5}, zmm24, [rbx+r11*8+256] vunpckhpd zmm24{k5}, zmm24, [rbx+r11*8-256] vunpckhpd zmm24{k5}{z}, zmm24, zmm31 vunpckhpd zmm24{k5}{z}, zmm24, [rbx] vunpckhpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vunpckhpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vunpckhpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vunpckhps xmm2, xmm7, xmm0 vunpckhps xmm2, xmm7, [rbx] vunpckhps xmm2, xmm7, [rbx]{1to4} vunpckhps xmm2, xmm7, [rbx+r11*8+256] vunpckhps xmm2, xmm7, [rbx+r11*8-256] vunpckhps xmm2{k5}, xmm7, xmm0 vunpckhps xmm2{k5}, xmm7, [rbx] vunpckhps xmm2{k5}, xmm7, [rbx]{1to4} vunpckhps xmm2{k5}, xmm7, [rbx+r11*8+256] vunpckhps xmm2{k5}, xmm7, [rbx+r11*8-256] vunpckhps xmm2{k5}{z}, xmm7, xmm0 vunpckhps xmm2{k5}{z}, xmm7, [rbx] vunpckhps xmm2{k5}{z}, xmm7, [rbx]{1to4} vunpckhps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vunpckhps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vunpckhps ymm16, ymm13, ymm15 vunpckhps ymm16, ymm13, [rbx] vunpckhps ymm16, ymm13, [rbx]{1to8} vunpckhps ymm16, ymm13, [rbx+r11*8+256] vunpckhps ymm16, ymm13, [rbx+r11*8-256] vunpckhps ymm16{k5}, ymm13, ymm15 vunpckhps ymm16{k5}, ymm13, [rbx] vunpckhps ymm16{k5}, ymm13, [rbx]{1to8} vunpckhps ymm16{k5}, ymm13, [rbx+r11*8+256] vunpckhps ymm16{k5}, ymm13, [rbx+r11*8-256] vunpckhps ymm16{k5}{z}, ymm13, ymm15 vunpckhps ymm16{k5}{z}, ymm13, [rbx] vunpckhps ymm16{k5}{z}, ymm13, [rbx]{1to8} vunpckhps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vunpckhps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vunpckhps zmm24, zmm24, zmm31 vunpckhps zmm24, zmm24, [rbx] vunpckhps zmm24, zmm24, [rbx]{1to16} vunpckhps zmm24, zmm24, [rbx+r11*8+256] vunpckhps zmm24, zmm24, [rbx+r11*8-256] vunpckhps zmm24{k5}, zmm24, zmm31 vunpckhps zmm24{k5}, zmm24, [rbx] vunpckhps zmm24{k5}, zmm24, [rbx]{1to16} vunpckhps zmm24{k5}, zmm24, [rbx+r11*8+256] vunpckhps zmm24{k5}, zmm24, [rbx+r11*8-256] vunpckhps zmm24{k5}{z}, zmm24, zmm31 vunpckhps zmm24{k5}{z}, zmm24, [rbx] vunpckhps zmm24{k5}{z}, zmm24, [rbx]{1to16} vunpckhps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vunpckhps zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vunpcklpd xmm2, xmm7, xmm0 vunpcklpd xmm2, xmm7, [rbx] vunpcklpd xmm2, xmm7, [rbx]{1to2} vunpcklpd xmm2, xmm7, [rbx+r11*8+256] vunpcklpd xmm2, xmm7, [rbx+r11*8-256] vunpcklpd xmm2{k5}, xmm7, xmm0 vunpcklpd xmm2{k5}, xmm7, [rbx] vunpcklpd xmm2{k5}, xmm7, [rbx]{1to2} vunpcklpd xmm2{k5}, xmm7, [rbx+r11*8+256] vunpcklpd xmm2{k5}, xmm7, [rbx+r11*8-256] vunpcklpd xmm2{k5}{z}, xmm7, xmm0 vunpcklpd xmm2{k5}{z}, xmm7, [rbx] vunpcklpd xmm2{k5}{z}, xmm7, [rbx]{1to2} vunpcklpd xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vunpcklpd xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vunpcklpd ymm16, ymm13, ymm15 vunpcklpd ymm16, ymm13, [rbx] vunpcklpd ymm16, ymm13, [rbx]{1to4} vunpcklpd ymm16, ymm13, [rbx+r11*8+256] vunpcklpd ymm16, ymm13, [rbx+r11*8-256] vunpcklpd ymm16{k5}, ymm13, ymm15 vunpcklpd ymm16{k5}, ymm13, [rbx] vunpcklpd ymm16{k5}, ymm13, [rbx]{1to4} vunpcklpd ymm16{k5}, ymm13, [rbx+r11*8+256] vunpcklpd ymm16{k5}, ymm13, [rbx+r11*8-256] vunpcklpd ymm16{k5}{z}, ymm13, ymm15 vunpcklpd ymm16{k5}{z}, ymm13, [rbx] vunpcklpd ymm16{k5}{z}, ymm13, [rbx]{1to4} vunpcklpd ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vunpcklpd ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vunpcklpd zmm24, zmm24, zmm31 vunpcklpd zmm24, zmm24, [rbx] vunpcklpd zmm24, zmm24, [rbx]{1to8} vunpcklpd zmm24, zmm24, [rbx+r11*8+256] vunpcklpd zmm24, zmm24, [rbx+r11*8-256] vunpcklpd zmm24{k5}, zmm24, zmm31 vunpcklpd zmm24{k5}, zmm24, [rbx] vunpcklpd zmm24{k5}, zmm24, [rbx]{1to8} vunpcklpd zmm24{k5}, zmm24, [rbx+r11*8+256] vunpcklpd zmm24{k5}, zmm24, [rbx+r11*8-256] vunpcklpd zmm24{k5}{z}, zmm24, zmm31 vunpcklpd zmm24{k5}{z}, zmm24, [rbx] vunpcklpd zmm24{k5}{z}, zmm24, [rbx]{1to8} vunpcklpd zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vunpcklpd zmm24{k5}{z}, zmm24, [rbx+r11*8-256] vunpcklps xmm2, xmm7, xmm0 vunpcklps xmm2, xmm7, [rbx] vunpcklps xmm2, xmm7, [rbx]{1to4} vunpcklps xmm2, xmm7, [rbx+r11*8+256] vunpcklps xmm2, xmm7, [rbx+r11*8-256] vunpcklps xmm2{k5}, xmm7, xmm0 vunpcklps xmm2{k5}, xmm7, [rbx] vunpcklps xmm2{k5}, xmm7, [rbx]{1to4} vunpcklps xmm2{k5}, xmm7, [rbx+r11*8+256] vunpcklps xmm2{k5}, xmm7, [rbx+r11*8-256] vunpcklps xmm2{k5}{z}, xmm7, xmm0 vunpcklps xmm2{k5}{z}, xmm7, [rbx] vunpcklps xmm2{k5}{z}, xmm7, [rbx]{1to4} vunpcklps xmm2{k5}{z}, xmm7, [rbx+r11*8+256] vunpcklps xmm2{k5}{z}, xmm7, [rbx+r11*8-256] vunpcklps ymm16, ymm13, ymm15 vunpcklps ymm16, ymm13, [rbx] vunpcklps ymm16, ymm13, [rbx]{1to8} vunpcklps ymm16, ymm13, [rbx+r11*8+256] vunpcklps ymm16, ymm13, [rbx+r11*8-256] vunpcklps ymm16{k5}, ymm13, ymm15 vunpcklps ymm16{k5}, ymm13, [rbx] vunpcklps ymm16{k5}, ymm13, [rbx]{1to8} vunpcklps ymm16{k5}, ymm13, [rbx+r11*8+256] vunpcklps ymm16{k5}, ymm13, [rbx+r11*8-256] vunpcklps ymm16{k5}{z}, ymm13, ymm15 vunpcklps ymm16{k5}{z}, ymm13, [rbx] vunpcklps ymm16{k5}{z}, ymm13, [rbx]{1to8} vunpcklps ymm16{k5}{z}, ymm13, [rbx+r11*8+256] vunpcklps ymm16{k5}{z}, ymm13, [rbx+r11*8-256] vunpcklps zmm24, zmm24, zmm31 vunpcklps zmm24, zmm24, [rbx] vunpcklps zmm24, zmm24, [rbx]{1to16} vunpcklps zmm24, zmm24, [rbx+r11*8+256] vunpcklps zmm24, zmm24, [rbx+r11*8-256] vunpcklps zmm24{k5}, zmm24, zmm31 vunpcklps zmm24{k5}, zmm24, [rbx] vunpcklps zmm24{k5}, zmm24, [rbx]{1to16} vunpcklps zmm24{k5}, zmm24, [rbx+r11*8+256] vunpcklps zmm24{k5}, zmm24, [rbx+r11*8-256] vunpcklps zmm24{k5}{z}, zmm24, zmm31 vunpcklps zmm24{k5}{z}, zmm24, [rbx] vunpcklps zmm24{k5}{z}, zmm24, [rbx]{1to16} vunpcklps zmm24{k5}{z}, zmm24, [rbx+r11*8+256] vunpcklps zmm24{k5}{z}, zmm24, [rbx+r11*8-256]