├── .gitignore
├── Java
    ├── SignatureGenerator
    │   ├── pom.xml
    │   └── src
    │   │   └── main
    │   │       └── java
    │   │           └── converter
    │   │               ├── Main.java
    │   │               └── Signature.java
    └── signature-june2016.txt
├── LICENSE
├── Python
    ├── extract.py
    ├── html
    │   └── style.css
    ├── htmltext.py
    ├── htmltext.py.orig
    ├── pdftable.py
    ├── pdftable.py.orig
    ├── x86manual.py
    └── x86manual.py.orig
├── README.md
├── html
    ├── AAA.html
    ├── AAD.html
    ├── AAM.html
    ├── AAS.html
    ├── ADC.html
    ├── ADCX.html
    ├── ADD.html
    ├── ADDPD.html
    ├── ADDPS.html
    ├── ADDSD.html
    ├── ADDSS.html
    ├── ADDSUBPD.html
    ├── ADDSUBPS.html
    ├── ADOX.html
    ├── AESDEC.html
    ├── AESDECLAST.html
    ├── AESENC.html
    ├── AESENCLAST.html
    ├── AESIMC.html
    ├── AESKEYGENASSIST.html
    ├── AND.html
    ├── ANDN.html
    ├── ANDNPD.html
    ├── ANDNPS.html
    ├── ANDPD.html
    ├── ANDPS.html
    ├── ARPL.html
    ├── BEXTR.html
    ├── BLENDPD.html
    ├── BLENDPS.html
    ├── BLENDVPD.html
    ├── BLENDVPS.html
    ├── BLSI.html
    ├── BLSMSK.html
    ├── BLSR.html
    ├── BNDCL.html
    ├── BNDCU_BNDCN.html
    ├── BNDLDX.html
    ├── BNDMK.html
    ├── BNDMOV.html
    ├── BNDSTX.html
    ├── BOUND.html
    ├── BSF.html
    ├── BSR.html
    ├── BSWAP.html
    ├── BT.html
    ├── BTC.html
    ├── BTR.html
    ├── BTS.html
    ├── BZHI.html
    ├── CALL.html
    ├── CBW_CWDE_CDQE.html
    ├── CLAC.html
    ├── CLC.html
    ├── CLD.html
    ├── CLFLUSH.html
    ├── CLFLUSHOPT.html
    ├── CLI.html
    ├── CLTS.html
    ├── CMC.html
    ├── CMOVcc.html
    ├── CMP.html
    ├── CMPPD.html
    ├── CMPPS.html
    ├── CMPSD.html
    ├── CMPSS.html
    ├── CMPS_CMPSB_CMPSW_CMPSD_CMPSQ.html
    ├── CMPXCHG.html
    ├── CMPXCHG8B_CMPXCHG16B.html
    ├── COMISD.html
    ├── COMISS.html
    ├── CPUID.html
    ├── CRC32.html
    ├── CVTDQ2PD.html
    ├── CVTDQ2PS.html
    ├── CVTPD2DQ.html
    ├── CVTPD2PI.html
    ├── CVTPD2PS.html
    ├── CVTPI2PD.html
    ├── CVTPI2PS.html
    ├── CVTPS2DQ.html
    ├── CVTPS2PD.html
    ├── CVTPS2PI.html
    ├── CVTSD2SI.html
    ├── CVTSD2SS.html
    ├── CVTSI2SD.html
    ├── CVTSI2SS.html
    ├── CVTSS2SD.html
    ├── CVTSS2SI.html
    ├── CVTTPD2DQ.html
    ├── CVTTPD2PI.html
    ├── CVTTPS2DQ.html
    ├── CVTTPS2PI.html
    ├── CVTTSD2SI.html
    ├── CVTTSS2SI.html
    ├── CWD_CDQ_CQO.html
    ├── DAA.html
    ├── DAS.html
    ├── DEC.html
    ├── DIV.html
    ├── DIVPD.html
    ├── DIVPS.html
    ├── DIVSD.html
    ├── DIVSS.html
    ├── DPPD.html
    ├── DPPS.html
    ├── EMMS.html
    ├── ENTER.html
    ├── EXTRACTPS.html
    ├── F2XM1.html
    ├── FABS.html
    ├── FADD_FADDP_FIADD.html
    ├── FBLD.html
    ├── FBSTP.html
    ├── FCHS.html
    ├── FCLEX_FNCLEX.html
    ├── FCMOVcc.html
    ├── FCOMI_FCOMIP_FUCOMI_FUCOMIP.html
    ├── FCOM_FCOMP_FCOMPP.html
    ├── FCOS.html
    ├── FDECSTP.html
    ├── FDIVR_FDIVRP_FIDIVR.html
    ├── FDIV_FDIVP_FIDIV.html
    ├── FFREE.html
    ├── FICOM_FICOMP.html
    ├── FILD.html
    ├── FINCSTP.html
    ├── FINIT_FNINIT.html
    ├── FISTTP.html
    ├── FIST_FISTP.html
    ├── FLD.html
    ├── FLD1_FLDL2T_FLDL2E_FLDPI_FLDLG2_FLDLN2_FLDZ.html
    ├── FLDCW.html
    ├── FLDENV.html
    ├── FMUL_FMULP_FIMUL.html
    ├── FNOP.html
    ├── FPATAN.html
    ├── FPREM.html
    ├── FPREM1.html
    ├── FPTAN.html
    ├── FRNDINT.html
    ├── FRSTOR.html
    ├── FSAVE_FNSAVE.html
    ├── FSCALE.html
    ├── FSIN.html
    ├── FSINCOS.html
    ├── FSQRT.html
    ├── FSTCW_FNSTCW.html
    ├── FSTENV_FNSTENV.html
    ├── FSTSW_FNSTSW.html
    ├── FST_FSTP.html
    ├── FSUBR_FSUBRP_FISUBR.html
    ├── FSUB_FSUBP_FISUB.html
    ├── FTST.html
    ├── FUCOM_FUCOMP_FUCOMPP.html
    ├── FXAM.html
    ├── FXCH.html
    ├── FXRSTOR.html
    ├── FXSAVE.html
    ├── FXTRACT.html
    ├── FYL2X.html
    ├── FYL2XP1.html
    ├── HADDPD.html
    ├── HADDPS.html
    ├── HLT.html
    ├── HSUBPD.html
    ├── HSUBPS.html
    ├── IDIV.html
    ├── IMUL.html
    ├── IN.html
    ├── INC.html
    ├── INSERTPS.html
    ├── INS_INSB_INSW_INSD.html
    ├── INT n_INTO_INT 3.html
    ├── INVD.html
    ├── INVLPG.html
    ├── INVPCID.html
    ├── IRET_IRETD.html
    ├── JMP.html
    ├── Jcc.html
    ├── KADDW_KADDB_KADDQ_KADDD.html
    ├── KANDNW_KANDNB_KANDNQ_KANDND.html
    ├── KANDW_KANDB_KANDQ_KANDD.html
    ├── KMOVW_KMOVB_KMOVQ_KMOVD.html
    ├── KNOTW_KNOTB_KNOTQ_KNOTD.html
    ├── KORTESTW_KORTESTB_KORTESTQ_KORTESTD.html
    ├── KORW_KORB_KORQ_KORD.html
    ├── KSHIFTLW_KSHIFTLB_KSHIFTLQ_KSHIFTLD.html
    ├── KSHIFTRW_KSHIFTRB_KSHIFTRQ_KSHIFTRD.html
    ├── KTESTW_KTESTB_KTESTQ_KTESTD.html
    ├── KUNPCKBW_KUNPCKWD_KUNPCKDQ.html
    ├── KXNORW_KXNORB_KXNORQ_KXNORD.html
    ├── KXORW_KXORB_KXORQ_KXORD.html
    ├── LAHF.html
    ├── LAR.html
    ├── LDDQU.html
    ├── LDMXCSR.html
    ├── LDS_LES_LFS_LGS_LSS.html
    ├── LEA.html
    ├── LEAVE.html
    ├── LFENCE.html
    ├── LGDT_LIDT.html
    ├── LLDT.html
    ├── LMSW.html
    ├── LOCK.html
    ├── LODS_LODSB_LODSW_LODSD_LODSQ.html
    ├── LOOP_LOOPcc.html
    ├── LSL.html
    ├── LTR.html
    ├── LZCNT.html
    ├── MASKMOVDQU.html
    ├── MASKMOVQ.html
    ├── MAXPD.html
    ├── MAXPS.html
    ├── MAXSD.html
    ├── MAXSS.html
    ├── MFENCE.html
    ├── MINPD.html
    ├── MINPS.html
    ├── MINSD.html
    ├── MINSS.html
    ├── MONITOR.html
    ├── MOV-1.html
    ├── MOV-2.html
    ├── MOV.html
    ├── MOVAPD.html
    ├── MOVAPS.html
    ├── MOVBE.html
    ├── MOVDDUP.html
    ├── MOVDQ2Q.html
    ├── MOVDQA,VMOVDQA32_64.html
    ├── MOVDQU,VMOVDQU8_16_32_64.html
    ├── MOVD_MOVQ.html
    ├── MOVHLPS.html
    ├── MOVHPD.html
    ├── MOVHPS.html
    ├── MOVLHPS.html
    ├── MOVLPD.html
    ├── MOVLPS.html
    ├── MOVMSKPD.html
    ├── MOVMSKPS.html
    ├── MOVNTDQ.html
    ├── MOVNTDQA.html
    ├── MOVNTI.html
    ├── MOVNTPD.html
    ├── MOVNTPS.html
    ├── MOVNTQ.html
    ├── MOVQ.html
    ├── MOVQ2DQ.html
    ├── MOVSD.html
    ├── MOVSHDUP.html
    ├── MOVSLDUP.html
    ├── MOVSS.html
    ├── MOVSX_MOVSXD.html
    ├── MOVS_MOVSB_MOVSW_MOVSD_MOVSQ.html
    ├── MOVUPD.html
    ├── MOVUPS.html
    ├── MOVZX.html
    ├── MPSADBW.html
    ├── MUL.html
    ├── MULPD.html
    ├── MULPS.html
    ├── MULSD.html
    ├── MULSS.html
    ├── MULX.html
    ├── MWAIT.html
    ├── NEG.html
    ├── NOP.html
    ├── NOT.html
    ├── OR.html
    ├── ORPD.html
    ├── ORPS.html
    ├── OUT.html
    ├── OUTS_OUTSB_OUTSW_OUTSD.html
    ├── PABSB_PABSW_PABSD_PABSQ.html
    ├── PACKSSWB_PACKSSDW.html
    ├── PACKUSDW.html
    ├── PACKUSWB.html
    ├── PADDB_PADDW_PADDD_PADDQ.html
    ├── PADDSB_PADDSW.html
    ├── PADDUSB_PADDUSW.html
    ├── PALIGNR.html
    ├── PAND.html
    ├── PANDN.html
    ├── PAUSE.html
    ├── PAVGB_PAVGW.html
    ├── PBLENDVB.html
    ├── PBLENDW.html
    ├── PCLMULQDQ.html
    ├── PCMPEQB_PCMPEQW_PCMPEQD.html
    ├── PCMPEQQ.html
    ├── PCMPESTRI.html
    ├── PCMPESTRM.html
    ├── PCMPGTB_PCMPGTW_PCMPGTD.html
    ├── PCMPGTQ.html
    ├── PCMPISTRI.html
    ├── PCMPISTRM.html
    ├── PDEP.html
    ├── PEXT.html
    ├── PEXTRB_PEXTRD_PEXTRQ.html
    ├── PEXTRW.html
    ├── PHADDSW.html
    ├── PHADDW_PHADDD.html
    ├── PHMINPOSUW.html
    ├── PHSUBSW.html
    ├── PHSUBW_PHSUBD.html
    ├── PINSRB_PINSRD_PINSRQ.html
    ├── PINSRW.html
    ├── PMADDUBSW.html
    ├── PMADDWD.html
    ├── PMAXSB_PMAXSW_PMAXSD_PMAXSQ.html
    ├── PMAXUB_PMAXUW.html
    ├── PMAXUD_PMAXUQ.html
    ├── PMINSB_PMINSW.html
    ├── PMINSD_PMINSQ.html
    ├── PMINUB_PMINUW.html
    ├── PMINUD_PMINUQ.html
    ├── PMOVMSKB.html
    ├── PMOVSX.html
    ├── PMOVZX.html
    ├── PMULDQ.html
    ├── PMULHRSW.html
    ├── PMULHUW.html
    ├── PMULHW.html
    ├── PMULLD_PMULLQ.html
    ├── PMULLW.html
    ├── PMULUDQ.html
    ├── POP.html
    ├── POPA_POPAD.html
    ├── POPCNT.html
    ├── POPF_POPFD_POPFQ.html
    ├── POR.html
    ├── PREFETCHW.html
    ├── PREFETCHWT1.html
    ├── PREFETCHh.html
    ├── PROLD_PROLVD_PROLQ_PROLVQ.html
    ├── PRORD_PRORVD_PRORQ_PRORVQ.html
    ├── PSADBW.html
    ├── PSHUFB.html
    ├── PSHUFD.html
    ├── PSHUFHW.html
    ├── PSHUFLW.html
    ├── PSHUFW.html
    ├── PSIGNB_PSIGNW_PSIGND.html
    ├── PSLLDQ.html
    ├── PSLLW_PSLLD_PSLLQ.html
    ├── PSRAW_PSRAD_PSRAQ.html
    ├── PSRLDQ.html
    ├── PSRLW_PSRLD_PSRLQ.html
    ├── PSUBB_PSUBW_PSUBD.html
    ├── PSUBQ.html
    ├── PSUBSB_PSUBSW.html
    ├── PSUBUSB_PSUBUSW.html
    ├── PTEST.html
    ├── PTWRITE.html
    ├── PUNPCKHBW_PUNPCKHWD_PUNPCKHDQ_PUNPCKHQDQ.html
    ├── PUNPCKLBW_PUNPCKLWD_PUNPCKLDQ_PUNPCKLQDQ.html
    ├── PUSH.html
    ├── PUSHA_PUSHAD.html
    ├── PUSHF_PUSHFD.html
    ├── PXOR.html
    ├── RCL_RCR_ROL_ROR.html
    ├── RCPPS.html
    ├── RCPSS.html
    ├── RDFSBASE_RDGSBASE.html
    ├── RDMSR.html
    ├── RDPID.html
    ├── RDPKRU.html
    ├── RDPMC.html
    ├── RDRAND.html
    ├── RDSEED.html
    ├── RDTSC.html
    ├── RDTSCP.html
    ├── REP_REPE_REPZ_REPNE_REPNZ.html
    ├── RET.html
    ├── RORX.html
    ├── ROUNDPD.html
    ├── ROUNDPS.html
    ├── ROUNDSD.html
    ├── ROUNDSS.html
    ├── RSM.html
    ├── RSQRTPS.html
    ├── RSQRTSS.html
    ├── SAHF.html
    ├── SAL_SAR_SHL_SHR.html
    ├── SARX_SHLX_SHRX.html
    ├── SBB.html
    ├── SCAS_SCASB_SCASW_SCASD.html
    ├── SETcc.html
    ├── SFENCE.html
    ├── SGDT.html
    ├── SHA1MSG1.html
    ├── SHA1MSG2.html
    ├── SHA1NEXTE.html
    ├── SHA1RNDS4.html
    ├── SHA256MSG1.html
    ├── SHA256MSG2.html
    ├── SHA256RNDS2.html
    ├── SHLD.html
    ├── SHRD.html
    ├── SHUFPD.html
    ├── SHUFPS.html
    ├── SIDT.html
    ├── SLDT.html
    ├── SMSW.html
    ├── SQRTPD.html
    ├── SQRTPS.html
    ├── SQRTSD.html
    ├── SQRTSS.html
    ├── STAC.html
    ├── STC.html
    ├── STD.html
    ├── STI.html
    ├── STMXCSR.html
    ├── STOS_STOSB_STOSW_STOSD_STOSQ.html
    ├── STR.html
    ├── SUB.html
    ├── SUBPD.html
    ├── SUBPS.html
    ├── SUBSD.html
    ├── SUBSS.html
    ├── SWAPGS.html
    ├── SYSCALL.html
    ├── SYSENTER.html
    ├── SYSEXIT.html
    ├── SYSRET.html
    ├── TEST.html
    ├── TZCNT.html
    ├── UCOMISD.html
    ├── UCOMISS.html
    ├── UD2.html
    ├── UNPCKHPD.html
    ├── UNPCKHPS.html
    ├── UNPCKLPD.html
    ├── UNPCKLPS.html
    ├── VALIGND_VALIGNQ.html
    ├── VBLENDMPD_VBLENDMPS.html
    ├── VBROADCAST.html
    ├── VCOMPRESSPD.html
    ├── VCOMPRESSPS.html
    ├── VCVTPD2QQ.html
    ├── VCVTPD2UDQ.html
    ├── VCVTPD2UQQ.html
    ├── VCVTPH2PS.html
    ├── VCVTPS2PH.html
    ├── VCVTPS2QQ.html
    ├── VCVTPS2UDQ.html
    ├── VCVTPS2UQQ.html
    ├── VCVTQQ2PD.html
    ├── VCVTQQ2PS.html
    ├── VCVTSD2USI.html
    ├── VCVTSS2USI.html
    ├── VCVTTPD2QQ.html
    ├── VCVTTPD2UDQ.html
    ├── VCVTTPD2UQQ.html
    ├── VCVTTPS2QQ.html
    ├── VCVTTPS2UDQ.html
    ├── VCVTTPS2UQQ.html
    ├── VCVTTSD2USI.html
    ├── VCVTTSS2USI.html
    ├── VCVTUDQ2PD.html
    ├── VCVTUDQ2PS.html
    ├── VCVTUQQ2PD.html
    ├── VCVTUQQ2PS.html
    ├── VCVTUSI2SD.html
    ├── VCVTUSI2SS.html
    ├── VDBPSADBW.html
    ├── VERR_VERW.html
    ├── VEXP2PD.html
    ├── VEXP2PS.html
    ├── VEXPANDPD.html
    ├── VEXPANDPS.html
    ├── VEXTRACTF128_VEXTRACTF32x4_VEXTRACTF64x2_VEXTRACTF32x8_VEXTRACTF64x4.html
    ├── VEXTRACTI128_VEXTRACTI32x4_VEXTRACTI64x2_VEXTRACTI32x8_VEXTRACTI64x4.html
    ├── VFIXUPIMMPD.html
    ├── VFIXUPIMMPS.html
    ├── VFIXUPIMMSD.html
    ├── VFIXUPIMMSS.html
    ├── VFMADD132PD_VFMADD213PD_VFMADD231PD.html
    ├── VFMADD132PS_VFMADD213PS_VFMADD231PS.html
    ├── VFMADD132SD_VFMADD213SD_VFMADD231SD.html
    ├── VFMADD132SS_VFMADD213SS_VFMADD231SS.html
    ├── VFMADDSUB132PD_VFMADDSUB213PD_VFMADDSUB231PD.html
    ├── VFMADDSUB132PS_VFMADDSUB213PS_VFMADDSUB231PS.html
    ├── VFMSUB132PD_VFMSUB213PD_VFMSUB231PD.html
    ├── VFMSUB132PS_VFMSUB213PS_VFMSUB231PS.html
    ├── VFMSUB132SD_VFMSUB213SD_VFMSUB231SD.html
    ├── VFMSUB132SS_VFMSUB213SS_VFMSUB231SS.html
    ├── VFMSUBADD132PD_VFMSUBADD213PD_VFMSUBADD231PD.html
    ├── VFMSUBADD132PS_VFMSUBADD213PS_VFMSUBADD231PS.html
    ├── VFNMADD132PD_VFNMADD213PD_VFNMADD231PD.html
    ├── VFNMADD132PS_VFNMADD213PS_VFNMADD231PS.html
    ├── VFNMADD132SD_VFNMADD213SD_VFNMADD231SD.html
    ├── VFNMADD132SS_VFNMADD213SS_VFNMADD231SS.html
    ├── VFNMSUB132PD_VFNMSUB213PD_VFNMSUB231PD.html
    ├── VFNMSUB132PS_VFNMSUB213PS_VFNMSUB231PS.html
    ├── VFNMSUB132SD_VFNMSUB213SD_VFNMSUB231SD.html
    ├── VFNMSUB132SS_VFNMSUB213SS_VFNMSUB231SS.html
    ├── VFPCLASSPD.html
    ├── VFPCLASSPS.html
    ├── VFPCLASSSD.html
    ├── VFPCLASSSS.html
    ├── VGATHERDPD_VGATHERQPD.html
    ├── VGATHERDPS_VGATHERDPD.html
    ├── VGATHERDPS_VGATHERQPS.html
    ├── VGATHERPF0DPS_VGATHERPF0QPS_VGATHERPF0DPD_VGATHERPF0QPD.html
    ├── VGATHERPF1DPS_VGATHERPF1QPS_VGATHERPF1DPD_VGATHERPF1QPD.html
    ├── VGATHERQPS_VGATHERQPD.html
    ├── VGETEXPPD.html
    ├── VGETEXPPS.html
    ├── VGETEXPSD.html
    ├── VGETEXPSS.html
    ├── VGETMANTPD.html
    ├── VGETMANTPS.html
    ├── VGETMANTSD.html
    ├── VGETMANTSS.html
    ├── VINSERTF128_VINSERTF32x4_VINSERTF64x2_VINSERTF32x8_VINSERTF64x4.html
    ├── VINSERTI128_VINSERTI32x4_VINSERTI64x2_VINSERTI32x8_VINSERTI64x4.html
    ├── VMASKMOV.html
    ├── VPBLENDD.html
    ├── VPBLENDMB_VPBLENDMW.html
    ├── VPBLENDMD_VPBLENDMQ.html
    ├── VPBROADCAST.html
    ├── VPBROADCASTB_W_D_Q.html
    ├── VPBROADCASTM.html
    ├── VPCMPB_VPCMPUB.html
    ├── VPCMPD_VPCMPUD.html
    ├── VPCMPQ_VPCMPUQ.html
    ├── VPCMPW_VPCMPUW.html
    ├── VPCOMPRESSD.html
    ├── VPCOMPRESSQ.html
    ├── VPCONFLICTD_Q.html
    ├── VPERM2F128.html
    ├── VPERM2I128.html
    ├── VPERMD_VPERMW.html
    ├── VPERMI2W_D_Q_PS_PD.html
    ├── VPERMILPD.html
    ├── VPERMILPS.html
    ├── VPERMPD.html
    ├── VPERMPS.html
    ├── VPERMQ.html
    ├── VPEXPANDD.html
    ├── VPEXPANDQ.html
    ├── VPGATHERDD_VPGATHERDQ.html
    ├── VPGATHERDD_VPGATHERQD.html
    ├── VPGATHERDQ_VPGATHERQQ.html
    ├── VPGATHERQD_VPGATHERQQ.html
    ├── VPLZCNTD_Q.html
    ├── VPMASKMOV.html
    ├── VPMOVB2M_VPMOVW2M_VPMOVD2M_VPMOVQ2M.html
    ├── VPMOVDB_VPMOVSDB_VPMOVUSDB.html
    ├── VPMOVDW_VPMOVSDW_VPMOVUSDW.html
    ├── VPMOVM2B_VPMOVM2W_VPMOVM2D_VPMOVM2Q.html
    ├── VPMOVQB_VPMOVSQB_VPMOVUSQB.html
    ├── VPMOVQD_VPMOVSQD_VPMOVUSQD.html
    ├── VPMOVQW_VPMOVSQW_VPMOVUSQW.html
    ├── VPMOVWB_VPMOVSWB_VPMOVUSWB.html
    ├── VPSCATTERDD_VPSCATTERDQ_VPSCATTERQD_VPSCATTERQQ.html
    ├── VPSLLVW_VPSLLVD_VPSLLVQ.html
    ├── VPSRAVW_VPSRAVD_VPSRAVQ.html
    ├── VPSRLVW_VPSRLVD_VPSRLVQ.html
    ├── VPTERNLOGD_VPTERNLOGQ.html
    ├── VPTESTMB_VPTESTMW_VPTESTMD_VPTESTMQ.html
    ├── VPTESTNMB_W_D_Q.html
    ├── VRANGEPD.html
    ├── VRANGEPS.html
    ├── VRANGESD.html
    ├── VRANGESS.html
    ├── VRCP14PD.html
    ├── VRCP14PS.html
    ├── VRCP14SD.html
    ├── VRCP14SS.html
    ├── VRCP28PD.html
    ├── VRCP28PS.html
    ├── VRCP28SD.html
    ├── VRCP28SS.html
    ├── VREDUCEPD.html
    ├── VREDUCEPS.html
    ├── VREDUCESD.html
    ├── VREDUCESS.html
    ├── VRNDSCALEPD.html
    ├── VRNDSCALEPS.html
    ├── VRNDSCALESD.html
    ├── VRNDSCALESS.html
    ├── VRSQRT14PD.html
    ├── VRSQRT14PS.html
    ├── VRSQRT14SD.html
    ├── VRSQRT14SS.html
    ├── VRSQRT28PD.html
    ├── VRSQRT28PS.html
    ├── VRSQRT28SD.html
    ├── VRSQRT28SS.html
    ├── VSCALEFPD.html
    ├── VSCALEFPS.html
    ├── VSCALEFSD.html
    ├── VSCALEFSS.html
    ├── VSCATTERDPS_VSCATTERDPD_VSCATTERQPS_VSCATTERQPD.html
    ├── VSCATTERPF0DPS_VSCATTERPF0QPS_VSCATTERPF0DPD_VSCATTERPF0QPD.html
    ├── VSCATTERPF1DPS_VSCATTERPF1QPS_VSCATTERPF1DPD_VSCATTERPF1QPD.html
    ├── VSHUFF32x4_VSHUFF64x2_VSHUFI32x4_VSHUFI64x2.html
    ├── VTESTPD_VTESTPS.html
    ├── VZEROALL.html
    ├── VZEROUPPER.html
    ├── WAIT_FWAIT.html
    ├── WBINVD.html
    ├── WRFSBASE_WRGSBASE.html
    ├── WRMSR.html
    ├── WRPKRU.html
    ├── XABORT.html
    ├── XACQUIRE_XRELEASE.html
    ├── XADD.html
    ├── XBEGIN.html
    ├── XCHG.html
    ├── XEND.html
    ├── XGETBV.html
    ├── XLAT_XLATB.html
    ├── XOR.html
    ├── XORPD.html
    ├── XORPS.html
    ├── XRSTOR.html
    ├── XRSTORS.html
    ├── XSAVE.html
    ├── XSAVEC.html
    ├── XSAVEOPT.html
    ├── XSAVES.html
    ├── XSETBV.html
    ├── XTEST.html
    └── style.css
├── index.html
└── parsejson.py


/.gitignore:
--------------------------------------------------------------------------------
1 | .*
2 | *.pdf
3 | *.pyc
4 | *.pyo
5 | *.json
6 | pdfminer/*
7 | html/*
8 | **/target/*
9 | 


--------------------------------------------------------------------------------
/Java/SignatureGenerator/pom.xml:
--------------------------------------------------------------------------------
 1 | <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
 2 | 	<modelVersion>4.0.0</modelVersion>
 3 | 	
 4 | 	<groupId>hjlebbink</groupId>
 5 | 	<artifactId>SignatureGenerator</artifactId>
 6 | 	<version>1.0.0-SNAPSHOT</version>
 7 | 	
 8 |      <dependencies>
 9 |      	<!-- logging -->
10 | 		<dependency>
11 | 			<groupId>org.slf4j</groupId>
12 | 			<artifactId>slf4j-api</artifactId>
13 | 			<version>1.7.16</version>
14 | 		</dependency>
15 | 		<dependency>
16 | 			<groupId>ch.qos.logback</groupId>
17 | 			<artifactId>logback-core</artifactId>
18 | 			<version>1.1.5</version>
19 | 		</dependency>
20 | 		<dependency>
21 | 			<groupId>ch.qos.logback</groupId>
22 | 			<artifactId>logback-classic</artifactId>
23 | 			<version>1.1.5</version>
24 | 		</dependency>
25 |      </dependencies>
26 | 
27 |     <!-- 
28 | 	<build>
29 |     <plugins>
30 |       <plugin>
31 |         <artifactId>maven-compiler-plugin</artifactId>
32 |         <version>3.5.1</version>
33 |         <configuration>
34 |           <source/>
35 |           <target/>
36 |         </configuration>
37 |       </plugin>
38 |       <plugin>
39 |         <artifactId>maven-surefire-plugin</artifactId>
40 |         <version>2.19.1</version>
41 |       </plugin>
42 |     </plugins>
43 |   </build>
44 |      -->
45 |      
46 | </project>


--------------------------------------------------------------------------------
/Java/SignatureGenerator/src/main/java/converter/Signature.java:
--------------------------------------------------------------------------------
 1 | package converter;
 2 | 
 3 | public class Signature implements Comparable<Signature> {
 4 | 	public String mnemonic;
 5 | 	public String operands;
 6 | 	public String operandsDoc;
 7 | 	public String cpuFlags;
 8 | 	public String description;
 9 | 	public Signature(String mnemonic, String operands, String cpuFlags, String operandsDoc, String description) {
10 | 		this.mnemonic = mnemonic;
11 | 		this.operands = operands;
12 | 		this.operandsDoc = operandsDoc;
13 | 		this.cpuFlags = cpuFlags;
14 | 		this.description = description;
15 | 	}
16 | 	public int compareTo(Signature o) {
17 | 		final int i1 = this.mnemonic.compareTo(o.mnemonic);
18 | 		if (i1 != 0) return i1;
19 | 		return this.operands.compareTo(o.operands);
20 | 	}
21 | }
22 | 
23 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | The MIT License (MIT)
 2 | 
 3 | Copyright (c) 2016 Henk-Jan Lebbink
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/Python/extract.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python
 2 | # -*- coding: UTF-8 -*-
 3 | 
 4 | import sys
 5 | from pdfminer.pdfdocument import PDFDocument
 6 | from pdfminer.pdfparser import PDFParser
 7 | from pdfminer.pdfinterp import PDFResourceManager, PDFPageInterpreter
 8 | from pdfminer.pdfpage import PDFPage
 9 | from pdfminer.layout import LAParams
10 | from pdfminer.converter import PDFPageAggregator
11 | from x86manual import x86ManParser
12 | 
def main(argv):
	"""Run the x86 manual parser over every PDF named on the command line.

	For each path in ``argv[1:]`` the PDF is laid out page by page with
	pdfminer, each page layout is fed to an ``x86ManParser``, a success/fail
	summary is printed, and the parser's opcode JSON is written to
	``opcodes.json`` in the current directory.

	NOTE(review): ``opcodes.json`` is rewritten for every input file, so with
	several arguments only the last document's output survives. This matches
	the original behaviour and is left unchanged.

	Args:
		argv: full argument vector; ``argv[0]`` (the program name) is skipped.

	Returns:
		1 as soon as a document reports it is not extractable, otherwise
		None (which ``sys.exit`` treats as success).
	"""
	for arg in argv[1:]:
		# PDFs are binary data: open in "rb" so bytes reach pdfminer untouched,
		# and use a context manager so the handle is also released on the
		# early "not extractable" return.
		with open(arg, "rb") as fd:
			pdf_parser = PDFParser(fd)
			document = PDFDocument(pdf_parser)
			if not document.is_extractable:
				print("Document not extractable.")
				return 1

			params = LAParams(char_margin=1)
			resMan = PDFResourceManager(caching=True)
			device = PDFPageAggregator(resMan, laparams=params)
			interpreter = PDFPageInterpreter(resMan, device)
			# First argument is presumably the HTML output directory -- confirm in x86manual.py.
			manual = x86ManParser("html", params)

			pages = PDFPage.get_pages(fd, set(), caching=True, check_extractable=True)
			for i, page in enumerate(pages, 1):
				print("Processing page %i" % i)
				interpreter.process_page(page)
				# The aggregator device holds the layout of the page just interpreted.
				manual.process_page(device.get_result())
			manual.flush()

		print("Conversion result: %i/%i" % (manual.success, manual.success + manual.fail))

		with open("opcodes.json", "wb") as out:
			out.write(manual.output_opcodes_json())
42 | 
# Script entry point: main()'s return value becomes the process exit status.
if __name__ == "__main__":
	sys.exit(main(sys.argv))
46 | 


--------------------------------------------------------------------------------
/Python/html/style.css:
--------------------------------------------------------------------------------
1 | table { border-collapse: collapse }
2 | th, td { padding: 0px 10px; border: 1px #ddd solid; vertical-align: top }
3 | svg { display: block; margin: 0px auto }
4 | svg + h3 { text-align: center; }
5 | 
6 | .notes { font-size: 9pt; }


--------------------------------------------------------------------------------
/html/AAA.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AAA—ASCII Adjust After Addition </title></head>
 8 | <body>
 9 | <h1>AAA—ASCII Adjust After Addition</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>37</td>
20 | <td>AAA</td>
21 | <td>NP</td>
22 | <td>Invalid</td>
23 | <td>Valid</td>
24 | <td>ASCII adjust AL after addition.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Adjusts the sum of two unpacked BCD values to create an unpacked BCD result. The AL register is the implied source and destination operand for this instruction. The AAA instruction is only useful when it follows an ADD instruction that adds (binary addition) two unpacked BCD values and stores a byte result in the AL register. The AAA instruction then adjusts the contents of the AL register to contain the correct 1-digit unpacked BCD result.</p>
41 | <p>If the addition produces a decimal carry, the AH register increments by 1, and the CF and AF flags are set. If there was no decimal carry, the CF and AF flags are cleared and the AH register is unchanged. In either case, bits 4 through 7 of the AL register are set to 0.</p>
42 | <p>This instruction executes as described in compatibility mode and legacy mode. It is not valid in 64-bit mode.</p>
43 | <h2>Operation</h2>
44 | <pre>IF 64-Bit Mode
45 |     THEN
46 |          #UD;
47 |     ELSE
48 |          IF ((AL AND 0FH) &gt; 9) or (AF = 1)
49 |               THEN
50 |                     AX ← AX + 106H;
51 |                     AF ← 1;
52 |                     CF ← 1;
53 |               ELSE
54 |                     AF ← 0;
55 |                     CF ← 0;
56 |          FI;
57 |          AL ← AL AND 0FH;
58 | FI;</pre>
59 | <h2>Flags Affected</h2>
60 | <p>The AF and CF flags are set to 1 if the adjustment results in a decimal carry; otherwise they are set to 0. The OF, SF, ZF, and PF flags are undefined.</p>
61 | <h2>Protected Mode Exceptions</h2>
62 | <table class="exception-table">
63 | <tr>
64 | <td>#UD</td>
65 | <td>If the LOCK prefix is used.</td></tr></table>
66 | <h2>Real-Address Mode Exceptions</h2>
67 | <p>Same exceptions as protected mode.</p>
68 | <h2>Virtual-8086 Mode Exceptions</h2>
69 | <p>Same exceptions as protected mode.</p>
70 | <h2>Compatibility Mode Exceptions</h2>
71 | <p>Same exceptions as protected mode.</p>
72 | <h2>64-Bit Mode Exceptions</h2>
73 | <table class="exception-table">
74 | <tr>
75 | <td>#UD</td>
76 | <td>If in 64-bit mode.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/AAS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AAS—ASCII Adjust AL After Subtraction </title></head>
 8 | <body>
 9 | <h1>AAS—ASCII Adjust AL After Subtraction</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>3F</td>
20 | <td>AAS</td>
21 | <td>NP</td>
22 | <td>Invalid</td>
23 | <td>Valid</td>
24 | <td>ASCII adjust AL after subtraction.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Adjusts the result of the subtraction of two unpacked BCD values to create an unpacked BCD result. The AL register is the implied source and destination operand for this instruction. The AAS instruction is only useful when it follows a SUB instruction that subtracts (binary subtraction) one unpacked BCD value from another and stores a byte result in the AL register. The AAS instruction then adjusts the contents of the AL register to contain the correct 1-digit unpacked BCD result.</p>
41 | <p>If the subtraction produced a decimal carry, the AH register decrements by 1, and the CF and AF flags are set. If no decimal carry occurred, the CF and AF flags are cleared, and the AH register is unchanged. In either case, the AL register is left with its top four bits set to 0.</p>
42 | <p>This instruction executes as described in compatibility mode and legacy mode. It is not valid in 64-bit mode.</p>
43 | <h2>Operation</h2>
44 | <pre>IF 64-bit mode
45 |     THEN
46 |          #UD;
47 |     ELSE
48 |          IF ((AL AND 0FH) &gt; 9) or (AF = 1)
49 |               THEN
50 |                     AX ← AX – 6;
51 |                     AH ← AH – 1;
52 |                     AF ← 1;
53 |                     CF ← 1;
54 |                     AL ← AL AND 0FH;
55 |               ELSE
56 |                     CF ← 0;
57 |                     AF ← 0;
58 |                     AL ← AL AND 0FH;
59 |          FI;
60 | FI;</pre>
61 | <h2>Flags Affected</h2>
62 | <p>The AF and CF flags are set to 1 if there is a decimal borrow; otherwise, they are cleared to 0. The OF, SF, ZF, and PF flags are undefined.</p>
63 | <h2>Protected Mode Exceptions</h2>
64 | <table class="exception-table">
65 | <tr>
66 | <td>#UD</td>
67 | <td>If the LOCK prefix is used.</td></tr></table>
68 | <h2>Real-Address Mode Exceptions</h2>
69 | <p>Same exceptions as protected mode.</p>
70 | <h2>Virtual-8086 Mode Exceptions</h2>
71 | <p>Same exceptions as protected mode.</p>
72 | <h2>Compatibility Mode Exceptions</h2>
73 | <p>Same exceptions as protected mode.</p>
74 | <h2>64-Bit Mode Exceptions</h2>
75 | <table class="exception-table">
76 | <tr>
77 | <td>#UD</td>
78 | <td>If in 64-bit mode.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/AESDEC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AESDEC—Perform One Round of an AES Decryption Flow </title></head>
 8 | <body>
 9 | <h1>AESDEC—Perform One Round of an AES Decryption Flow</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>66 0F 38 DE /r AESDEC xmm1, xmm2/m128</td>
19 | <td>RM</td>
20 | <td>V/V</td>
21 | <td>AES</td>
22 | <td>Perform one round of an AES decryption flow, using the Equivalent Inverse Cipher, operating on a 128-bit data (state) from xmm1 with a 128-bit round key from xmm2/m128.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.128.66.0F38.WIG DE /r VAESDEC xmm1, xmm2, xmm3/m128</td>
25 | <td>RVM</td>
26 | <td>V/V</td>
27 | <td>Both AES and AVX flags</td>
28 | <td>Perform one round of an AES decryption flow, using the Equivalent Inverse Cipher, operating on a 128-bit data (state) from xmm2 with a 128-bit round key from xmm3/m128; store the result in xmm1.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RM</td>
39 | <td>ModRM:reg (r, w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr>
43 | <tr>
44 | <td>RVM</td>
45 | <td>ModRM:reg (w)</td>
46 | <td>VEX.vvvv (r)</td>
47 | <td>ModRM:r/m (r)</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>This instruction performs a single round of the AES decryption flow using the Equivalent Inverse Cipher, with the round key from the second source operand, operating on a 128-bit data (state) from the first source operand, and store the result in the destination operand.</p>
51 | <p>Use the AESDEC instruction for all but the last decryption round. For the last decryption round, use the AESDECLAST instruction.</p>
52 | <p>128-bit Legacy SSE version: The first source operand and the destination operand are the same and must be an XMM register. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the corresponding YMM destination register remain unchanged.</p>
53 | <p>VEX.128 encoded version: The first source operand and the destination operand are XMM registers. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the destination YMM register are zeroed.</p>
54 | <h2>Operation</h2>
55 | <p><strong>AESDEC</strong></p>
56 | <pre>STATE ← SRC1;
57 | RoundKey ← SRC2;
58 | STATE ← InvShiftRows( STATE );
59 | STATE ← InvSubBytes( STATE );
60 | STATE ← InvMixColumns( STATE );
61 | DEST[127:0] ← STATE XOR RoundKey;
62 | DEST[VLMAX-1:128] (Unmodified)</pre>
63 | <p><strong>VAESDEC</strong></p>
64 | <pre>STATE ← SRC1;
65 | RoundKey ← SRC2;
66 | STATE ← InvShiftRows( STATE );
67 | STATE ← InvSubBytes( STATE );
68 | STATE ← InvMixColumns( STATE );
69 | DEST[127:0] ← STATE XOR RoundKey;
70 | DEST[VLMAX-1:128] ← 0</pre>
71 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
72 | <p>(V)AESDEC:</p>
73 | <p>__m128i _mm_aesdec (__m128i, __m128i)</p>
74 | <h2>SIMD Floating-Point Exceptions</h2>
75 | <p>None</p>
76 | <h2>Other Exceptions</h2>
77 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/AESDECLAST.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AESDECLAST—Perform Last Round of an AES Decryption Flow </title></head>
 8 | <body>
 9 | <h1>AESDECLAST—Perform Last Round of an AES Decryption Flow</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>66 0F 38 DF /r AESDECLAST xmm1, xmm2/m128</td>
19 | <td>RM</td>
20 | <td>V/V</td>
21 | <td>AES</td>
22 | <td>Perform the last round of an AES decryption flow, using the Equivalent Inverse Cipher, operating on a 128-bit data (state) from xmm1 with a 128-bit round key from xmm2/m128.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.128.66.0F38.WIG DF /r VAESDECLAST xmm1, xmm2, xmm3/m128</td>
25 | <td>RVM</td>
26 | <td>V/V</td>
27 | <td>Both AES and AVX flags</td>
28 | <td>Perform the last round of an AES decryption flow, using the Equivalent Inverse Cipher, operating on a 128-bit data (state) from xmm2 with a 128-bit round key from xmm3/m128; store the result in xmm1.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RM</td>
39 | <td>ModRM:reg (r, w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr>
43 | <tr>
44 | <td>RVM</td>
45 | <td>ModRM:reg (w)</td>
46 | <td>VEX.vvvv (r)</td>
47 | <td>ModRM:r/m (r)</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>This instruction performs the last round of the AES decryption flow using the Equivalent Inverse Cipher, with the round key from the second source operand, operating on a 128-bit data (state) from the first source operand, and stores the result in the destination operand.</p>
51 | <p>128-bit Legacy SSE version: The first source operand and the destination operand are the same and must be an XMM register. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the corresponding YMM destination register remain unchanged.</p>
52 | <p>VEX.128 encoded version: The first source operand and the destination operand are XMM registers. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the destination YMM register are zeroed.</p>
53 | <h2>Operation</h2>
54 | <p><strong>AESDECLAST</strong></p>
55 | <pre>STATE ← SRC1;
56 | RoundKey ← SRC2;
57 | STATE ← InvShiftRows( STATE );
58 | STATE ← InvSubBytes( STATE );
59 | DEST[127:0] ← STATE XOR RoundKey;
60 | DEST[VLMAX-1:128] (Unmodified)</pre>
61 | <p><strong>VAESDECLAST</strong></p>
62 | <pre>STATE ← SRC1;
63 | RoundKey ← SRC2;
64 | STATE ← InvShiftRows( STATE );
65 | STATE ← InvSubBytes( STATE );
66 | DEST[127:0] ← STATE XOR RoundKey;
67 | DEST[VLMAX-1:128] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>(V)AESDECLAST:</p>
70 | <p>__m128i _mm_aesdeclast (__m128i, __m128i)</p>
71 | <h2>SIMD Floating-Point Exceptions</h2>
72 | <p>None</p>
73 | <h2>Other Exceptions</h2>
74 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/AESENC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AESENC—Perform One Round of an AES Encryption Flow </title></head>
 8 | <body>
 9 | <h1>AESENC—Perform One Round of an AES Encryption Flow</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>66 0F 38 DC /r AESENC xmm1, xmm2/m128</td>
19 | <td>RM</td>
20 | <td>V/V</td>
21 | <td>AES</td>
22 | <td>Perform one round of an AES encryption flow, operating on a 128-bit data (state) from xmm1 with a 128-bit round key from xmm2/m128.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.128.66.0F38.WIG DC /r VAESENC xmm1, xmm2, xmm3/m128</td>
25 | <td>RVM</td>
26 | <td>V/V</td>
27 | <td>Both AES and AVX flags</td>
28 | <td>Perform one round of an AES encryption flow, operating on a 128-bit data (state) from xmm2 with a 128-bit round key from xmm3/m128; store the result in xmm1.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RM</td>
39 | <td>ModRM:reg (r, w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr>
43 | <tr>
44 | <td>RVM</td>
45 | <td>ModRM:reg (w)</td>
46 | <td>VEX.vvvv (r)</td>
47 | <td>ModRM:r/m (r)</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>This instruction performs a single round of an AES encryption flow using a round key from the second source operand, operating on 128-bit data (state) from the first source operand, and stores the result in the destination operand.</p>
51 | <p>Use the AESENC instruction for all but the last encryption round. For the last encryption round, use the AESENCLAST instruction.</p>
52 | <p>128-bit Legacy SSE version: The first source operand and the destination operand are the same and must be an XMM register. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the corresponding YMM destination register remain unchanged.</p>
53 | <p>VEX.128 encoded version: The first source operand and the destination operand are XMM registers. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the destination YMM register are zeroed.</p>
54 | <h2>Operation</h2>
55 | <p><strong>AESENC</strong></p>
56 | <pre>STATE ← SRC1;
57 | RoundKey ← SRC2;
58 | STATE ← ShiftRows( STATE );
59 | STATE ← SubBytes( STATE );
60 | STATE ← MixColumns( STATE );
61 | DEST[127:0] ← STATE XOR RoundKey;
62 | DEST[VLMAX-1:128] (Unmodified)</pre>
63 | <p><strong>VAESENC</strong></p>
64 | <pre>STATE ← SRC1;
65 | RoundKey ← SRC2;
66 | STATE ← ShiftRows( STATE );
67 | STATE ← SubBytes( STATE );
68 | STATE ← MixColumns( STATE );
69 | DEST[127:0] ← STATE XOR RoundKey;
70 | DEST[VLMAX-1:128] ← 0</pre>
71 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
72 | <p>(V)AESENC:</p>
73 | <p>__m128i _mm_aesenc (__m128i, __m128i)</p>
74 | <h2>SIMD Floating-Point Exceptions</h2>
75 | <p>None</p>
76 | <h2>Other Exceptions</h2>
77 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/AESENCLAST.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AESENCLAST—Perform Last Round of an AES Encryption Flow </title></head>
 8 | <body>
 9 | <h1>AESENCLAST—Perform Last Round of an AES Encryption Flow</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>66 0F 38 DD /r AESENCLAST xmm1, xmm2/m128</td>
19 | <td>RM</td>
20 | <td>V/V</td>
21 | <td>AES</td>
22 | <td>Perform the last round of an AES encryption flow, operating on a 128-bit data (state) from xmm1 with a 128-bit round key from xmm2/m128.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.128.66.0F38.WIG DD /r VAESENCLAST xmm1, xmm2, xmm3/m128</td>
25 | <td>RVM</td>
26 | <td>V/V</td>
27 | <td>Both AES and AVX flags</td>
28 | <td>Perform the last round of an AES encryption flow, operating on a 128-bit data (state) from xmm2 with a 128-bit round key from xmm3/m128; store the result in xmm1.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RM</td>
39 | <td>ModRM:reg (r, w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr>
43 | <tr>
44 | <td>RVM</td>
45 | <td>ModRM:reg (w)</td>
46 | <td>VEX.vvvv (r)</td>
47 | <td>ModRM:r/m (r)</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>This instruction performs the last round of an AES encryption flow using a round key from the second source operand, operating on 128-bit data (state) from the first source operand, and stores the result in the destination operand.</p>
51 | <p>128-bit Legacy SSE version: The first source operand and the destination operand are the same and must be an XMM register. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the corresponding YMM destination register remain unchanged.</p>
52 | <p>VEX.128 encoded version: The first source operand and the destination operand are XMM registers. The second source operand can be an XMM register or a 128-bit memory location. Bits (VLMAX-1:128) of the destination YMM register are zeroed.</p>
53 | <h2>Operation</h2>
54 | <p><strong>AESENCLAST</strong></p>
55 | <pre>STATE ← SRC1;
56 | RoundKey ← SRC2;
57 | STATE ← ShiftRows( STATE );
58 | STATE ← SubBytes( STATE );
59 | DEST[127:0] ← STATE XOR RoundKey;
60 | DEST[VLMAX-1:128] (Unmodified)</pre>
61 | <p><strong>VAESENCLAST</strong></p>
62 | <pre>STATE ← SRC1;
63 | RoundKey ← SRC2;
64 | STATE ← ShiftRows( STATE );
65 | STATE ← SubBytes( STATE );
66 | DEST[127:0] ← STATE XOR RoundKey;
67 | DEST[VLMAX-1:128] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>(V)AESENCLAST:</p>
70 | <p>__m128i _mm_aesenclast (__m128i, __m128i)</p>
71 | <h2>SIMD Floating-Point Exceptions</h2>
72 | <p>None</p>
73 | <h2>Other Exceptions</h2>
74 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/AESIMC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>AESIMC—Perform the AES InvMixColumn Transformation </title></head>
 8 | <body>
 9 | <h1>AESIMC—Perform the AES InvMixColumn Transformation</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>66 0F 38 DB /r AESIMC xmm1, xmm2/m128</td>
19 | <td>RM</td>
20 | <td>V/V</td>
21 | <td>AES</td>
22 | <td>Perform the InvMixColumn transformation on a 128-bit round key from xmm2/m128 and store the result in xmm1.</td></tr>
23 | <tr>
24 | <td>VEX.128.66.0F38.WIG DB /r VAESIMC xmm1, xmm2/m128</td>
25 | <td>RM</td>
26 | <td>V/V</td>
27 | <td>Both AES and AVX flags</td>
28 | <td>Perform the InvMixColumn transformation on a 128-bit round key from xmm2/m128 and store the result in xmm1.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RM</td>
39 | <td>ModRM:reg (w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Perform the InvMixColumns transformation on the source operand and store the result in the destination operand. The destination operand is an XMM register. The source operand can be an XMM register or a 128-bit memory location.</p>
45 | <p>Note: the AESIMC instruction should be applied to the expanded AES round keys (except for the first and last round key) in order to prepare them for decryption using the “Equivalent Inverse Cipher” (defined in FIPS 197).</p>
46 | <p>128-bit Legacy SSE version: Bits (VLMAX-1:128) of the corresponding YMM destination register remain unchanged.</p>
47 | <p>VEX.128 encoded version: Bits (VLMAX-1:128) of the destination YMM register are zeroed.</p>
48 | <p>Note: In VEX-encoded versions, VEX.vvvv is reserved and must be 1111b, otherwise instructions will #UD.</p>
49 | <h2>Operation</h2>
50 | <p><strong>AESIMC</strong></p>
51 | <pre>DEST[127:0] ← InvMixColumns( SRC );
52 | DEST[VLMAX-1:128] (Unmodified)</pre>
53 | <p><strong>VAESIMC</strong></p>
54 | <pre>DEST[127:0] ← InvMixColumns( SRC );
55 | DEST[VLMAX-1:128] ← 0;</pre>
56 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
57 | <p>(V)AESIMC:</p>
58 | <p>__m128i _mm_aesimc (__m128i)</p>
59 | <h2>SIMD Floating-Point Exceptions</h2>
60 | <p>None</p>
61 | <h2>Other Exceptions</h2>
62 | <p>See Exceptions Type 4; additionally</p>
63 | <table class="exception-table">
64 | <tr>
65 | <td>#UD</td>
66 | <td>If VEX.vvvv ≠ 1111B.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/ANDN.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>ANDN — Logical AND NOT </title></head>
 8 | <body>
 9 | <h1>ANDN — Logical AND NOT</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.LZ.0F38.W0 F2 /r ANDN r32a, r32b, r/m32</td>
19 | <td>RVM</td>
20 | <td>V/V</td>
21 | <td>BMI1</td>
22 | <td>Bitwise AND of inverted r32b with r/m32, store result in r32a.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.LZ.0F38.W1 F2 /r ANDN r64a, r64b, r/m64</td>
25 | <td>RVM</td>
26 | <td>V/NE</td>
27 | <td>BMI1</td>
28 | <td>Bitwise AND of inverted r64b with r/m64, store result in r64a.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>RVM</td>
39 | <td>ModRM:reg (w)</td>
40 | <td>VEX.vvvv (r)</td>
41 | <td>ModRM:r/m (r)</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Performs a bitwise logical AND of inverted second operand (the first source operand) with the third operand (the second source operand). The result is stored in the first operand (destination operand).</p>
45 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
46 | <h2>Operation</h2>
47 | <pre>DEST ← (NOT SRC1) bitwiseAND SRC2;
48 | SF ← DEST[OperandSize -1];
49 | ZF ← (DEST = 0);</pre>
50 | <h2>Flags Affected</h2>
51 | <p>SF and ZF are updated based on result. OF and CF flags are cleared. AF and PF flags are undefined.</p>
52 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
53 | <p>Auto-generated from high-level language.</p>
54 | <h2>SIMD Floating-Point Exceptions</h2>
55 | <p>None</p>
56 | <h2>Other Exceptions</h2>
57 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
58 | <table class="exception-table">
59 | <tr>
60 | <td>#UD</td>
61 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/BLSI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>BLSI — Extract Lowest Set Isolated Bit </title></head>
 8 | <body>
 9 | <h1>BLSI — Extract Lowest Set Isolated Bit</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDD.LZ.0F38.W0 F3 /3 BLSI r32, r/m32</td>
19 | <td>VM</td>
20 | <td>V/V</td>
21 | <td>BMI1</td>
22 | <td>Extract lowest set bit from r/m32 and set that bit in r32.</td></tr>
23 | <tr>
24 | <td>VEX.NDD.LZ.0F38.W1 F3 /3 BLSI r64, r/m64</td>
25 | <td>VM</td>
26 | <td>V/N.E.</td>
27 | <td>BMI1</td>
28 | <td>Extract lowest set bit from r/m64, and set that bit in r64.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>VM</td>
39 | <td>VEX.vvvv (w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Extracts the lowest set bit from the source operand and sets the corresponding bit in the destination register. All other bits in the destination operand are zeroed. If no bits are set in the source operand, BLSI sets all the bits in the destination to 0, sets ZF, and clears CF.</p>
45 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
46 | <h2>Operation</h2>
47 | <pre>temp ← (-SRC) bitwiseAND (SRC);
48 | SF ← temp[OperandSize -1];
49 | ZF ← (temp = 0);
50 | IF SRC = 0
51 |     CF ← 0;
52 | ELSE
53 |     CF ← 1;
54 | FI
55 | DEST ← temp;</pre>
56 | <h2>Flags Affected</h2>
57 | <p>ZF and SF are updated based on the result. CF is set if the source is not zero. OF flag is cleared. AF and PF flags are undefined.</p>
58 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
59 | <p>BLSI:</p>
60 | <p>unsigned __int32 _blsi_u32(unsigned __int32 src);</p>
61 | <p>BLSI:</p>
62 | <p>unsigned __int64 _blsi_u64(unsigned __int64 src);</p>
63 | <h2>SIMD Floating-Point Exceptions</h2>
64 | <p>None</p>
65 | <h2>Other Exceptions</h2>
66 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
67 | <table class="exception-table">
68 | <tr>
69 | <td>#UD</td>
70 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/BLSMSK.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>BLSMSK — Get Mask Up to Lowest Set Bit </title></head>
 8 | <body>
 9 | <h1>BLSMSK — Get Mask Up to Lowest Set Bit</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDD.LZ.0F38.W0 F3 /2 BLSMSK r32, r/m32</td>
19 | <td>VM</td>
20 | <td>V/V</td>
21 | <td>BMI1</td>
22 | <td>Set all lower bits in r32 to “1” starting from bit 0 to lowest set bit in r/m32.</td></tr>
23 | <tr>
24 | <td>VEX.NDD.LZ.0F38.W1 F3 /2 BLSMSK r64, r/m64</td>
25 | <td>VM</td>
26 | <td>V/N.E.</td>
27 | <td>BMI1</td>
28 | <td>Set all lower bits in r64 to “1” starting from bit 0 to lowest set bit in r/m64.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>VM</td>
39 | <td>VEX.vvvv (w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Sets all the lower bits of the destination operand to “1” up to and including lowest set bit (=1) in the source operand. If source operand is zero, BLSMSK sets all bits of the destination operand to 1 and also sets CF to 1.</p>
45 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
46 | <h2>Operation</h2>
47 | <pre>temp ← (SRC-1) XOR (SRC) ;
48 | SF ← temp[OperandSize -1];
49 | ZF ← 0;
50 | IF SRC = 0
51 |     CF ← 1;
52 | ELSE
53 |     CF ← 0;
54 | FI
55 | DEST ← temp;</pre>
56 | <h2>Flags Affected</h2>
57 | <p>SF is updated based on the result. CF is set if the source is zero. ZF and OF flags are cleared. AF and PF flags are undefined.</p>
58 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
59 | <p>BLSMSK:</p>
60 | <p>unsigned __int32 _blsmsk_u32(unsigned __int32 src);</p>
61 | <p>BLSMSK:</p>
62 | <p>unsigned __int64 _blsmsk_u64(unsigned __int64 src);</p>
63 | <h2>SIMD Floating-Point Exceptions</h2>
64 | <p>None</p>
65 | <h2>Other Exceptions</h2>
66 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
67 | <table class="exception-table">
68 | <tr>
69 | <td>#UD</td>
70 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/BLSR.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>BLSR — Reset Lowest Set Bit </title></head>
 8 | <body>
 9 | <h1>BLSR — Reset Lowest Set Bit</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDD.LZ.0F38.W0 F3 /1 BLSR r32, r/m32</td>
19 | <td>VM</td>
20 | <td>V/V</td>
21 | <td>BMI1</td>
22 | <td>Reset lowest set bit of r/m32, keep all other bits of r/m32 and write result to r32.</td></tr>
23 | <tr>
24 | <td>VEX.NDD.LZ.0F38.W1 F3 /1 BLSR r64, r/m64</td>
25 | <td>VM</td>
26 | <td>V/N.E.</td>
27 | <td>BMI1</td>
28 | <td>Reset lowest set bit of r/m64, keep all other bits of r/m64 and write result to r64.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>VM</td>
39 | <td>VEX.vvvv (w)</td>
40 | <td>ModRM:r/m (r)</td>
41 | <td>NA</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Copies all bits from the source operand to the destination operand and resets (=0) the bit position in the destination operand that corresponds to the lowest set bit of the source operand. If the source operand is zero BLSR sets CF.</p>
45 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
46 | <h2>Operation</h2>
47 | <pre>temp ← (SRC-1) bitwiseAND ( SRC );
48 | SF ← temp[OperandSize -1];
49 | ZF ← (temp = 0);
50 | IF SRC = 0
51 |     CF ← 1;
52 | ELSE
53 |     CF ← 0;
54 | FI
55 | DEST ← temp;</pre>
56 | <h2>Flags Affected</h2>
57 | <p>ZF and SF flags are updated based on the result. CF is set if the source is zero. OF flag is cleared. AF and PF flags are undefined.</p>
58 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
59 | <p>BLSR:</p>
60 | <p>unsigned __int32 _blsr_u32(unsigned __int32 src);</p>
61 | <p>BLSR:</p>
62 | <p>unsigned __int64 _blsr_u64(unsigned __int64 src);</p>
63 | <h2>SIMD Floating-Point Exceptions</h2>
64 | <p>None</p>
65 | <h2>Other Exceptions</h2>
66 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
67 | <table class="exception-table">
68 | <tr>
69 | <td>#UD</td>
70 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/BSWAP.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>BSWAP—Byte Swap </title></head>
 8 | <body>
 9 | <h1>BSWAP—Byte Swap</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F C8+<em>rd</em></td>
20 | <td>BSWAP <em>r32</em></td>
21 | <td>O</td>
22 | <td>Valid*</td>
23 | <td>Valid</td>
24 | <td>Reverses the byte order of a 32-bit register.</td></tr>
25 | <tr>
26 | <td>REX.W + 0F C8+<em>rd</em></td>
27 | <td>BSWAP <em>r64</em></td>
28 | <td>O</td>
29 | <td>Valid</td>
30 | <td>N.E.</td>
31 | <td>Reverses the byte order of a 64-bit register.</td></tr></table>
32 | <p><strong>NOTES:</strong></p>
33 | <p>*</p>
34 | <p>See IA-32 Architecture Compatibility section below.</p>
35 | <h3>Instruction Operand Encoding</h3>
36 | <table>
37 | <tr>
38 | <td>Op/En</td>
39 | <td>Operand 1</td>
40 | <td>Operand 2</td>
41 | <td>Operand 3</td>
42 | <td>Operand 4</td></tr>
43 | <tr>
44 | <td>O</td>
45 | <td>opcode + rd (r, w)</td>
46 | <td>NA</td>
47 | <td>NA</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>Reverses the byte order of a 32-bit or 64-bit (destination) register. This instruction is provided for converting little-endian values to big-endian format and vice versa. To swap bytes in a word value (16-bit register), use the XCHG instruction. When the BSWAP instruction references a 16-bit register, the result is undefined.</p>
51 | <p>In 64-bit mode, the instruction’s default operation size is 32 bits. Using a REX prefix in the form of REX.R permits access to additional registers (R8-R15). Using a REX prefix in the form of REX.W promotes operation to 64 bits. See the summary chart at the beginning of this section for encoding data and limits.</p>
52 | <h2>IA-32 Architecture Legacy Compatibility</h2>
53 | <p>The BSWAP instruction is not supported on IA-32 processors earlier than the Intel486™ processor family. For compatibility with this instruction, software should include functionally equivalent code for execution on Intel processors earlier than the Intel486 processor family.</p>
54 | <h2>Operation</h2>
55 | <pre>TEMP ← DEST
56 | IF 64-bit mode AND OperandSize = 64
57 |     THEN
58 |          DEST[7:0] ← TEMP[63:56];
59 |          DEST[15:8] ← TEMP[55:48];
60 |          DEST[23:16] ← TEMP[47:40];
61 |          DEST[31:24] ← TEMP[39:32];
62 |          DEST[39:32] ← TEMP[31:24];
63 |          DEST[47:40] ← TEMP[23:16];
64 |          DEST[55:48] ← TEMP[15:8];
65 |          DEST[63:56] ← TEMP[7:0];
66 |     ELSE
67 |          DEST[7:0] ← TEMP[31:24];
68 |          DEST[15:8] ← TEMP[23:16];
69 |          DEST[23:16] ← TEMP[15:8];
70 |          DEST[31:24] ← TEMP[7:0];
71 | FI;</pre>
72 | <h2>Flags Affected</h2>
73 | <p>None.</p>
74 | <h2>Exceptions (All Operating Modes)</h2>
75 | <p>#UD</p>
76 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/BZHI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>BZHI — Zero High Bits Starting with Specified Bit Position </title></head>
 8 | <body>
 9 | <h1>BZHI — Zero High Bits Starting with Specified Bit Position</h1>
10 | <table>
11 | <tr>
12 | <td>
13 | <p><strong>Opcode/Instruction</strong></p>
14 | <p>VEX.NDS<sup>1</sup>.LZ.0F38.W0 F5 /r BZHI r32a, r/m32, r32b</p>
15 | <p>VEX.NDS<sup>1</sup>.LZ.0F38.W1 F5 /r BZHI r64a, r/m64, r64b</p></td>
16 | <td>
17 | <p><strong>Op/En</strong></p>
18 | <p>RMV</p>
19 | <p>RMV</p></td>
20 | <td>
21 | <p><strong>64/32-bit Mode</strong></p>
22 | <p>V/V</p>
23 | <p>V/N.E.</p></td>
24 | <td>
25 | <p><strong>CPUID Feature Flag</strong></p>
26 | <p>BMI2</p>
27 | <p>BMI2</p></td>
28 | <td>
29 | <p><strong>Description</strong></p>
30 | <p>Zero bits in r/m32 starting with the position in r32b, write result to r32a.</p>
31 | <p>Zero bits in r/m64 starting with the position in r64b, write result to r64a.</p></td></tr></table>
32 | <p><strong>NOTES:</strong></p>
33 | <p>1. ModRM:r/m is used to encode the first source operand (second operand) and VEX.vvvv encodes the second source operand (third</p>
34 | <p>operand).</p>
35 | <h3>Instruction Operand Encoding</h3>
36 | <table>
37 | <tr>
38 | <td>Op/En</td>
39 | <td>Operand 1</td>
40 | <td>Operand 2</td>
41 | <td>Operand 3</td>
42 | <td>Operand 4</td></tr>
43 | <tr>
44 | <td>RMV</td>
45 | <td>ModRM:reg (w)</td>
46 | <td>ModRM:r/m (r)</td>
47 | <td>VEX.vvvv (r)</td>
48 | <td>NA</td></tr></table>
49 | <h2>Description</h2>
50 | <p>BZHI copies the bits of the first source operand (the second operand) into the destination operand (the first operand) and clears the higher bits in the destination according to the INDEX value specified by the second source operand (the third operand). The INDEX is specified by bits 7:0 of the second source operand. The INDEX value is saturated at the value of OperandSize -1. CF is set, if the number contained in the 8 low bits of the third operand is greater than OperandSize -1.</p>
51 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
52 | <h2>Operation</h2>
53 | <pre>N ← SRC2[7:0]
54 | DEST ← SRC1
55 | IF (N &lt; OperandSize)
56 |     DEST[OperandSize-1:N] ← 0
57 | FI
58 | IF (N &gt; OperandSize - 1)
59 |     CF ← 1
60 | ELSE
61 |     CF ← 0
62 | FI</pre>
63 | <h2>Flags Affected</h2>
64 | <p>ZF, CF and SF flags are updated based on the result. OF flag is cleared. AF and PF flags are undefined.</p>
65 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
66 | <p>BZHI:</p>
67 | <p>unsigned __int32 _bzhi_u32(unsigned __int32 src, unsigned __int32 index);</p>
68 | <p>BZHI:</p>
69 | <p>unsigned __int64 _bzhi_u64(unsigned __int64 src, unsigned __int32 index);</p>
70 | <h2>SIMD Floating-Point Exceptions</h2>
71 | <p>None</p>
72 | <h2>Other Exceptions</h2>
73 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
74 | <table class="exception-table">
75 | <tr>
76 | <td>#UD</td>
77 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/CBW_CWDE_CDQE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CBW/CWDE/CDQE—Convert Byte to Word/Convert Word to Doubleword/Convert Doubleword to Quadword </title></head>
 8 | <body>
 9 | <h1>CBW/CWDE/CDQE—Convert Byte to Word/Convert Word to Doubleword/Convert Doubleword to Quadword</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>98</td>
20 | <td>CBW</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>AX ← sign-extend of AL.</td></tr>
25 | <tr>
26 | <td>98</td>
27 | <td>CWDE</td>
28 | <td>NP</td>
29 | <td>Valid</td>
30 | <td>Valid</td>
31 | <td>EAX ← sign-extend of AX.</td></tr>
32 | <tr>
33 | <td>REX.W + 98</td>
34 | <td>CDQE</td>
35 | <td>NP</td>
36 | <td>Valid</td>
37 | <td>N.E.</td>
38 | <td>RAX ← sign-extend of EAX.</td></tr></table>
39 | <h3>Instruction Operand Encoding</h3>
40 | <table>
41 | <tr>
42 | <td>Op/En</td>
43 | <td>Operand 1</td>
44 | <td>Operand 2</td>
45 | <td>Operand 3</td>
46 | <td>Operand 4</td></tr>
47 | <tr>
48 | <td>NP</td>
49 | <td>NA</td>
50 | <td>NA</td>
51 | <td>NA</td>
52 | <td>NA</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Double the size of the source operand by means of sign extension. The CBW (convert byte to word) instruction copies the sign (bit 7) in the source operand into every bit in the AH register. The CWDE (convert word to doubleword) instruction copies the sign (bit 15) of the word in the AX register into the high 16 bits of the EAX register.</p>
55 | <p>CBW and CWDE reference the same opcode. The CBW instruction is intended for use when the operand-size attribute is 16; CWDE is intended for use when the operand-size attribute is 32. Some assemblers may force the operand size. Others may treat these two mnemonics as synonyms (CBW/CWDE) and use the setting of the operand-size attribute to determine the size of values to be converted.</p>
56 | <p>In 64-bit mode, the default operation size is the size of the destination register. Use of the REX.W prefix promotes this instruction (CDQE when promoted) to operate on 64-bit operands. In which case, CDQE copies the sign (bit 31) of the doubleword in the EAX register into the high 32 bits of RAX.</p>
57 | <h2>Operation</h2>
58 | <pre>IF OperandSize = 16 (* Instruction = CBW *)
59 |     THEN
60 |          AX ← SignExtend(AL);
61 |     ELSE IF (OperandSize = 32, Instruction = CWDE)
62 |          EAX ← SignExtend(AX); FI;
63 |     ELSE (* 64-Bit Mode, OperandSize = 64, Instruction = CDQE*)
64 |          RAX ← SignExtend(EAX);
65 | FI;</pre>
66 | <h2>Flags Affected</h2>
67 | <p>None.</p>
68 | <h2>Exceptions (All Operating Modes)</h2>
69 | <p>#UD</p>
70 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/CLAC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CLAC—Clear AC Flag in EFLAGS Register </title></head>
 8 | <body>
 9 | <h1>CLAC—Clear AC Flag in EFLAGS Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 01 CA</td>
20 | <td>CLAC</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Clear the AC flag in the EFLAGS register.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Clears the AC flag bit in EFLAGS register. This disables any alignment checking of user-mode data accesses. If the SMAP bit is set in the CR4 register, this disallows explicit supervisor-mode data accesses to user-mode pages.</p>
41 | <p>This instruction's operation is the same in non-64-bit modes and 64-bit mode. Attempts to execute CLAC when CPL &gt; 0 cause #UD.</p>
42 | <h2>Operation</h2>
43 | <pre>EFLAGS.AC ← 0;</pre>
44 | <h2>Flags Affected</h2>
45 | <p>AC cleared. Other flags are unaffected.</p>
46 | <h2>Protected Mode Exceptions</h2>
47 | <table class="exception-table">
48 | <tr>
49 | <td>#UD</td>
50 | <td>
51 | <p>If the LOCK prefix is used.</p>
52 | <p>If the CPL &gt; 0.</p>
53 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
54 | <h2>Real-Address Mode Exceptions</h2>
55 | <table class="exception-table">
56 | <tr>
57 | <td>#UD</td>
58 | <td>
59 | <p>If the LOCK prefix is used.</p>
60 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
61 | <h2>Virtual-8086 Mode Exceptions</h2>
62 | <table class="exception-table">
63 | <tr>
64 | <td>#UD</td>
65 | <td>The CLAC instruction is not recognized in virtual-8086 mode.</td></tr></table>
66 | <h2>Compatibility Mode Exceptions</h2>
67 | <table class="exception-table">
68 | <tr>
69 | <td>#UD</td>
70 | <td>
71 | <p>If the LOCK prefix is used.</p>
72 | <p>If the CPL &gt; 0.</p>
73 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
74 | <h2>64-Bit Mode Exceptions</h2>
75 | <table class="exception-table">
76 | <tr>
77 | <td>#UD</td>
78 | <td>
79 | <p>If the LOCK prefix is used.</p>
80 | <p>If the CPL &gt; 0.</p>
81 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/CLC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CLC—Clear Carry Flag </title></head>
 8 | <body>
 9 | <h1>CLC—Clear Carry Flag</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F8</td>
20 | <td>CLC</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Clear CF flag.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Clears the CF flag in the EFLAGS register. Operation is the same in all modes.</p>
41 | <h2>Operation</h2>
42 | <pre>CF ← 0;</pre>
43 | <h2>Flags Affected</h2>
44 | <p>The CF flag is set to 0. The OF, ZF, SF, AF, and PF flags are unaffected.</p>
45 | <h2>Exceptions (All Operating Modes)</h2>
46 | <p>#UD</p>
47 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/CLD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CLD—Clear Direction Flag </title></head>
 8 | <body>
 9 | <h1>CLD—Clear Direction Flag</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>FC</td>
20 | <td>CLD</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Clear DF flag.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Clears the DF flag in the EFLAGS register. When the DF flag is set to 0, string operations increment the index registers (ESI and/or EDI). Operation is the same in all modes.</p>
41 | <h2>Operation</h2>
42 | <pre>DF ← 0;</pre>
43 | <h2>Flags Affected</h2>
44 | <p>The DF flag is set to 0. The CF, OF, ZF, SF, AF, and PF flags are unaffected.</p>
45 | <h2>Exceptions (All Operating Modes)</h2>
46 | <p>#UD</p>
47 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/CLTS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CLTS—Clear Task-Switched Flag in CR0 </title></head>
 8 | <body>
 9 | <h1>CLTS—Clear Task-Switched Flag in CR0</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 06</td>
20 | <td>CLTS</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Clears TS flag in CR0.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Clears the task-switched (TS) flag in the CR0 register. This instruction is intended for use in operating-system procedures. It is a privileged instruction that can only be executed at a CPL of 0. It is allowed to be executed in real-address mode to allow initialization for protected mode.</p>
41 | <p>The processor sets the TS flag every time a task switch occurs. The flag is used to synchronize the saving of FPU context in multitasking applications. See the description of the TS flag in the section titled “Control Registers” in Chapter 2 of the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3A</em>, for more information about this flag.</p>
42 | <p>CLTS operation is the same in non-64-bit modes and 64-bit mode.</p>
43 | <p>See Chapter 25, “VMX Non-Root Operation,” of the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3C</em>, for more information about the behavior of this instruction in VMX non-root operation.</p>
44 | <h2>Operation</h2>
45 | <pre>CR0.TS[bit 3] ← 0;</pre>
46 | <h2>Flags Affected</h2>
47 | <p>The TS flag in CR0 register is cleared.</p>
48 | <h2>Protected Mode Exceptions</h2>
49 | <table class="exception-table">
50 | <tr>
51 | <td>#GP(0)</td>
52 | <td>If the current privilege level is not 0.</td></tr>
53 | <tr>
54 | <td>#UD</td>
55 | <td>If the LOCK prefix is used.</td></tr></table>
56 | <h2>Real-Address Mode Exceptions</h2>
57 | <table class="exception-table">
58 | <tr>
59 | <td>#UD</td>
60 | <td>If the LOCK prefix is used.</td></tr></table>
61 | <h2>Virtual-8086 Mode Exceptions</h2>
62 | <table class="exception-table">
63 | <tr>
64 | <td>#GP(0)</td>
65 | <td>CLTS is not recognized in virtual-8086 mode.</td></tr>
66 | <tr>
67 | <td>#UD</td>
68 | <td>If the LOCK prefix is used.</td></tr></table>
69 | <h2>Compatibility Mode Exceptions</h2>
70 | <p>Same exceptions as in protected mode.</p>
71 | <h2>64-Bit Mode Exceptions</h2>
72 | <table class="exception-table">
73 | <tr>
74 | <td>#GP(0)</td>
75 | <td>If the CPL is greater than 0.</td></tr>
76 | <tr>
77 | <td>#UD</td>
78 | <td>If the LOCK prefix is used.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/CMC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CMC—Complement Carry Flag </title></head>
 8 | <body>
 9 | <h1>CMC—Complement Carry Flag</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F5</td>
20 | <td>CMC</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Complement CF flag.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Complements the CF flag in the EFLAGS register. CMC operation is the same in non-64-bit modes and 64-bit mode.</p>
41 | <h2>Operation</h2>
42 | <pre>EFLAGS.CF[bit 0]← NOT EFLAGS.CF[bit 0];</pre>
43 | <h2>Flags Affected</h2>
44 | <p>The CF flag contains the complement of its original value. The OF, ZF, SF, AF, and PF flags are unaffected.</p>
45 | <h2>Exceptions (All Operating Modes)</h2>
46 | <p>#UD</p>
47 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/CVTPD2PI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTPD2PI—Convert Packed Double-Precision FP Values to Packed Dword Integers </title></head>
 8 | <body>
 9 | <h1>CVTPD2PI—Convert Packed Double-Precision FP Values to Packed Dword Integers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>66 0F 2D /<em>r</em></p>
20 | <p>CVTPD2PI <em>mm</em>, <em>xmm/m128</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two packed double-precision floating-point values from <em>xmm/m128</em> to two packed signed doubleword integers in <em>mm</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Converts two packed double-precision floating-point values in the source operand (second operand) to two packed signed doubleword integers in the destination operand (first operand).</p>
41 | <p>The source operand can be an XMM register or a 128-bit memory location. The destination operand is an MMX technology register.</p>
42 | <p>When a conversion is inexact, the value returned is rounded according to the rounding control bits in the MXCSR register. If a converted result is larger than the maximum signed doubleword integer, the floating-point invalid exception is raised, and if this exception is masked, the indefinite integer value (80000000H) is returned.</p>
43 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTPD2PI instruction is executed.</p>
44 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
45 | <h2>Operation</h2>
46 | <pre>DEST[31:0] ← Convert_Double_Precision_Floating_Point_To_Integer32(SRC[63:0]);
47 | DEST[63:32] ← Convert_Double_Precision_Floating_Point_To_Integer32(SRC[127:64]);</pre>
48 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
49 | <p>CVTPD2PI:</p>
50 | <p>__m64 _mm_cvtpd_pi32(__m128d a)</p>
51 | <h2>SIMD Floating-Point Exceptions</h2>
52 | <p>Invalid, Precision.</p>
53 | <h2>Other Exceptions</h2>
54 | <p>See Table 22-4, “Exception Conditions for Legacy SIMD/MMX Instructions with FP Exception and 16-Byte Alignment,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p>


--------------------------------------------------------------------------------
/html/CVTPI2PD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTPI2PD—Convert Packed Dword Integers to Packed Double-Precision FP Values </title></head>
 8 | <body>
 9 | <h1>CVTPI2PD—Convert Packed Dword Integers to Packed Double-Precision FP Values</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>66 0F 2A /<em>r</em></p>
20 | <p>CVTPI2PD <em>xmm</em>, <em>mm/m64*</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two packed signed doubleword integers from <em>mm/mem64</em> to two packed double-precision floating-point values in <em>xmm</em>.</td></tr></table>
25 | <p><strong>NOTES: *Operation is different for different operand sets; see the Description section.</strong></p>
26 | <h3>Instruction Operand Encoding</h3>
27 | <table>
28 | <tr>
29 | <td>Op/En</td>
30 | <td>Operand 1</td>
31 | <td>Operand 2</td>
32 | <td>Operand 3</td>
33 | <td>Operand 4</td></tr>
34 | <tr>
35 | <td>RM</td>
36 | <td>ModRM:reg (w)</td>
37 | <td>ModRM:r/m (r)</td>
38 | <td>NA</td>
39 | <td>NA</td></tr></table>
40 | <h2>Description</h2>
41 | <p>Converts two packed signed doubleword integers in the source operand (second operand) to two packed double-precision floating-point values in the destination operand (first operand).</p>
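42 | <p>The source operand can be an MMX technology register or a 64-bit memory location. The destination operand is an XMM register. In addition, depending on the operand configuration:</p><p>For operands <em>xmm</em>, <em>mm</em>: the instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTPI2PD instruction is executed.</p><p>For operands <em>xmm</em>, <em>m64</em>: the instruction does not cause a transition to MMX technology and does not take x87 FPU exceptions.</p>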
43 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
44 | <h2>Operation</h2>
45 | <pre>DEST[63:0] ← Convert_Integer_To_Double_Precision_Floating_Point(SRC[31:0]);
46 | DEST[127:64] ← Convert_Integer_To_Double_Precision_Floating_Point(SRC[63:32]);</pre>
47 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
48 | <p>CVTPI2PD:</p>
49 | <p>__m128d _mm_cvtpi32_pd(__m64 a)</p>
50 | <h2>SIMD Floating-Point Exceptions</h2>
51 | <p>None</p>
52 | <h2>Other Exceptions</h2>
53 | <p>See Table 22-6, “Exception Conditions for Legacy SIMD/MMX Instructions with XMM and without FP Exception,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/CVTPI2PS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTPI2PS—Convert Packed Dword Integers to Packed Single-Precision FP Values </title></head>
 8 | <body>
 9 | <h1>CVTPI2PS—Convert Packed Dword Integers to Packed Single-Precision FP Values</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 2A /<em>r</em></p>
20 | <p>CVTPI2PS <em>xmm</em>, <em>mm</em>/<em>m64</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two signed doubleword integers from <em>mm</em>/<em>m64</em> to two single-precision floating-point values in <em>xmm</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Converts two packed signed doubleword integers in the source operand (second operand) to two packed single-precision floating-point values in the destination operand (first operand).</p>
41 | <p>The source operand can be an MMX technology register or a 64-bit memory location. The destination operand is an XMM register. The results are stored in the low quadword of the destination operand, and the high quadword remains unchanged. When a conversion is inexact, the value returned is rounded according to the rounding control bits in the MXCSR register.</p>
42 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTPI2PS instruction is executed.</p>
43 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
44 | <h2>Operation</h2>
45 | <pre>DEST[31:0] ← Convert_Integer_To_Single_Precision_Floating_Point(SRC[31:0]);
46 | DEST[63:32] ← Convert_Integer_To_Single_Precision_Floating_Point(SRC[63:32]);
47 | (* High quadword of destination unchanged *)</pre>
48 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
49 | <p>CVTPI2PS:</p>
50 | <p>__m128 _mm_cvtpi32_ps(__m128 a, __m64 b)</p>
51 | <h2>SIMD Floating-Point Exceptions</h2>
52 | <p>Precision</p>
53 | <h2>Other Exceptions</h2>
54 | <p>See Table 22-5, “Exception Conditions for Legacy SIMD/MMX Instructions with XMM and FP Exception,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/CVTPS2PI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTPS2PI—Convert Packed Single-Precision FP Values to Packed Dword Integers </title></head>
 8 | <body>
 9 | <h1>CVTPS2PI—Convert Packed Single-Precision FP Values to Packed Dword Integers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 2D /<em>r</em></p>
20 | <p>CVTPS2PI <em>mm, xmm/m64</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two packed single-precision floating-point values from <em>xmm</em>/<em>m64</em> to two packed signed doubleword integers in <em>mm</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Converts two packed single-precision floating-point values in the source operand (second operand) to two packed signed doubleword integers in the destination operand (first operand).</p>
41 | <p>The source operand can be an XMM register or a 64-bit memory location. The destination operand is an MMX technology register. When the source operand is an XMM register, the two single-precision floating-point values are contained in the low quadword of the register. When a conversion is inexact, the value returned is rounded according to the rounding control bits in the MXCSR register. If a converted result is larger than the maximum signed doubleword integer, the floating-point invalid exception is raised, and if this exception is masked, the indefinite integer value (80000000H) is returned.</p>
42 | <p>CVTPS2PI causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTPS2PI instruction is executed.</p>
43 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
44 | <h2>Operation</h2>
45 | <pre>DEST[31:0] ← Convert_Single_Precision_Floating_Point_To_Integer(SRC[31:0]);
46 | DEST[63:32] ← Convert_Single_Precision_Floating_Point_To_Integer(SRC[63:32]);</pre>
47 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
48 | <p>CVTPS2PI:</p>
49 | <p>__m64 _mm_cvtps_pi32(__m128 a)</p>
50 | <h2>SIMD Floating-Point Exceptions</h2>
51 | <p>Invalid, Precision</p>
52 | <h2>Other Exceptions</h2>
53 | <p>See Table 22-5, “Exception Conditions for Legacy SIMD/MMX Instructions with XMM and FP Exception,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/CVTTPD2PI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTTPD2PI—Convert with Truncation Packed Double-Precision FP Values to Packed Dword Integers </title></head>
 8 | <body>
 9 | <h1>CVTTPD2PI—Convert with Truncation Packed Double-Precision FP Values to Packed Dword Integers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>66 0F 2C /<em>r</em></p>
20 | <p>CVTTPD2PI <em>mm</em>, <em>xmm/m128</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two packed double-precision floating-point values from <em>xmm/m128</em> to two packed signed doubleword integers in <em>mm</em> using truncation.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Converts two packed double-precision floating-point values in the source operand (second operand) to two packed signed doubleword integers in the destination operand (first operand). The source operand can be an XMM register or a 128-bit memory location. The destination operand is an MMX technology register.</p>
41 | <p>When a conversion is inexact, a truncated (round toward zero) result is returned. If a converted result is larger than the maximum signed doubleword integer, the floating-point invalid exception is raised, and if this exception is masked, the indefinite integer value (80000000H) is returned.</p>
42 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTTPD2PI instruction is executed.</p>
43 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
44 | <h2>Operation</h2>
45 | <pre>DEST[31:0] ← Convert_Double_Precision_Floating_Point_To_Integer32_Truncate(SRC[63:0]);
46 | DEST[63:32] ← Convert_Double_Precision_Floating_Point_To_Integer32_
47 |                     Truncate(SRC[127:64]);</pre>
48 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
49 | <p>CVTTPD2PI:</p>
50 | <p> __m64 _mm_cvttpd_pi32(__m128d a)</p>
51 | <h2>SIMD Floating-Point Exceptions</h2>
52 | <p>Invalid, Precision</p>
53 | <h2>Other Mode Exceptions</h2>
54 | <p>See Table 22-4, “Exception Conditions for Legacy SIMD/MMX Instructions with FP Exception and 16-Byte Alignment,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p>


--------------------------------------------------------------------------------
/html/CVTTPS2PI.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>CVTTPS2PI—Convert with Truncation Packed Single-Precision FP Values to Packed Dword Integers </title></head>
 8 | <body>
 9 | <h1>CVTTPS2PI—Convert with Truncation Packed Single-Precision FP Values to Packed Dword Integers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 2C /r</p>
20 | <p>CVTTPS2PI <em>mm</em>, <em>xmm/m64</em></p></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Convert two single-precision floating-point values from <em>xmm</em>/<em>m64</em> to two signed doubleword integers in <em>mm</em> using truncation.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Converts two packed single-precision floating-point values in the source operand (second operand) to two packed signed doubleword integers in the destination operand (first operand). The source operand can be an XMM register or a 64-bit memory location. The destination operand is an MMX technology register. When the source operand is an XMM register, the two single-precision floating-point values are contained in the low quadword of the register.</p>
41 | <p>When a conversion is inexact, a truncated (round toward zero) result is returned. If a converted result is larger than the maximum signed doubleword integer, the floating-point invalid exception is raised, and if this exception is masked, the indefinite integer value (80000000H) is returned.</p>
42 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the CVTTPS2PI instruction is executed.</p>
43 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
44 | <h2>Operation</h2>
45 | <pre>DEST[31:0] ← Convert_Single_Precision_Floating_Point_To_Integer_Truncate(SRC[31:0]);
46 | DEST[63:32] ← Convert_Single_Precision_Floating_Point_To_Integer_Truncate(SRC[63:32]);</pre>
47 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
48 | <p>CVTTPS2PI:</p>
49 | <p>__m64 _mm_cvttps_pi32(__m128 a)</p>
50 | <h2>SIMD Floating-Point Exceptions</h2>
51 | <p>Invalid, Precision</p>
52 | <h2>Other Exceptions</h2>
53 | <p>See Table 22-5, “Exception Conditions for Legacy SIMD/MMX Instructions with XMM and FP Exception,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3B</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/EMMS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>EMMS—Empty MMX Technology State </title></head>
 8 | <body>
 9 | <h1>EMMS—Empty MMX Technology State</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 77</td>
20 | <td>EMMS</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Set the x87 FPU tag word to empty.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Sets the values of all the tags in the x87 FPU tag word to empty (all 1s). This operation marks the x87 FPU data registers (which are aliased to the MMX technology registers) as available for use by x87 FPU floating-point instructions. (See Figure 8-7 in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 1</em>, for the format of the x87 FPU tag word.) All other MMX instructions (other than the EMMS instruction) set all the tags in x87 FPU tag word to valid (all 0s).</p>
41 | <p>The EMMS instruction must be used to clear the MMX technology state at the end of all MMX technology procedures or subroutines and before calling other procedures or subroutines that may execute x87 floating-point instructions. If a floating-point instruction loads one of the registers in the x87 FPU data register stack before the x87 FPU tag word has been reset by the EMMS instruction, an x87 floating-point register stack overflow can occur that will result in an x87 floating-point exception or incorrect result.</p>
42 | <p>EMMS operation is the same in non-64-bit modes and 64-bit mode.</p>
43 | <h2>Operation</h2>
44 | <pre>x87FPUTagWord ← FFFFH;</pre>
45 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
46 | <p>void _mm_empty()</p>
47 | <h2>Flags Affected</h2>
48 | <p>None</p>
49 | <h2>Protected Mode Exceptions</h2>
50 | <table class="exception-table">
51 | <tr>
52 | <td>#UD</td>
53 | <td>If CR0.EM[bit 2] = 1.</td></tr>
54 | <tr>
55 | <td>#NM</td>
56 | <td>If CR0.TS[bit 3] = 1.</td></tr>
57 | <tr>
58 | <td>#MF</td>
59 | <td>If there is a pending FPU exception.</td></tr>
60 | <tr>
61 | <td>#UD</td>
62 | <td>If the LOCK prefix is used.</td></tr></table>
63 | <h2>Real-Address Mode Exceptions</h2>
64 | <p>Same exceptions as in protected mode.</p>
65 | <h2>Virtual-8086 Mode Exceptions</h2>
66 | <p>Same exceptions as in protected mode.</p>
67 | <h2>Compatibility Mode Exceptions</h2>
68 | <p>Same exceptions as in protected mode.</p>
69 | <h2>64-Bit Mode Exceptions</h2>
70 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/F2XM1.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>F2XM1—Compute 2^x–1 </title></head>
 8 | <body>
 9 | <h1>F2XM1—Compute 2<sup>x</sup>–1</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 F0</td>
19 | <td>F2XM1</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Replace ST(0) with (2<sup>ST(0)</sup> – 1).</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Computes the exponential value of 2 to the power of the source operand minus 1. The source operand is located in register ST(0) and the result is also stored in ST(0). The value of the source operand must lie in the range –1.0 to +1.0. If the source value is outside this range, the result is undefined.</p>
25 | <p>The following table shows the results obtained when computing the exponential value of various classes of numbers, assuming that neither overflow nor underflow occurs.</p>
26 | <h3>Table 3-16.  Results Obtained from F2XM1</h3>
27 | <table>
28 | <tr>
29 | <th>ST(0) SRC</th>
30 | <th>ST(0) DEST</th></tr>
31 | <tr>
32 | <td>− 1.0 to −0</td>
33 | <td>− 0.5 to − 0</td></tr>
34 | <tr>
35 | <td>− 0</td>
36 | <td>− 0</td></tr>
37 | <tr>
38 | <td>+ 0</td>
39 | <td>+ 0</td></tr>
40 | <tr>
41 | <td>+ 0 to +1.0</td>
42 | <td>+ 0 to 1.0</td></tr></table>
43 | <p>Values other than 2 can be exponentiated using the following formula:</p>
44 | <p>x<sup>y</sup> ← 2<sup>(y ∗ log<sub>2</sub>x)</sup></p>
45 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
46 | <h2>Operation</h2>
47 | <pre>ST(0) ← (2<sup>ST(0)</sup> − 1);</pre>
48 | <h2>FPU Flags Affected</h2>
49 | <table class="exception-table">
50 | <tr>
51 | <td>C1</td>
52 | <td>
53 | <p>Set to 0 if stack underflow occurred.</p>
54 | <p>Set if result was rounded up; cleared otherwise.</p></td></tr>
55 | <tr>
56 | <td>C0, C2, C3</td>
57 | <td>Undefined.</td></tr></table>
58 | <h2>Floating-Point Exceptions</h2>
59 | <table class="exception-table">
60 | <tr>
61 | <td>#IS</td>
62 | <td>Stack underflow occurred.</td></tr>
63 | <tr>
64 | <td>#IA</td>
65 | <td>Source operand is an SNaN value or unsupported format.</td></tr>
66 | <tr><td>#D</td>
67 | <td>Source is a denormal value.</td></tr>
68 | <tr><td>#U</td>
69 | <td>Result is too small for destination format.</td></tr>
70 | <tr><td>#P</td>
71 | <td>Value cannot be represented exactly in destination format.</td></tr></table>
72 | <h2>Protected Mode Exceptions</h2>
73 | <table class="exception-table">
74 | <tr>
75 | <td>#NM</td>
76 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
77 | <tr>
78 | <td>#UD</td>
79 | <td>If the LOCK prefix is used.</td></tr></table>
80 | <h2>Real-Address Mode Exceptions</h2>
81 | <p>Same exceptions as in protected mode.</p>
82 | <h2>Virtual-8086 Mode Exceptions</h2>
83 | <p>Same exceptions as in protected mode.</p>
84 | <h2>Compatibility Mode Exceptions</h2>
85 | <p>Same exceptions as in protected mode.</p>
86 | <h2>64-Bit Mode Exceptions</h2>
87 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FABS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FABS—Absolute Value </title></head>
 8 | <body>
 9 | <h1>FABS—Absolute Value</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 E1</td>
19 | <td>FABS</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Replace ST with its absolute value.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Clears the sign bit of ST(0) to create the absolute value of the operand. The following table shows the results obtained when creating the absolute value of various classes of numbers.</p>
25 | <h3>Table 3-17.  Results Obtained from FABS</h3>
26 | <table>
27 | <tr>
28 | <th>ST(0) SRC</th>
29 | <th>ST(0) DEST</th></tr>
30 | <tr>
31 | <td>− ∞</td>
32 | <td>+ ∞</td></tr>
33 | <tr>
34 | <td>− F</td>
35 | <td>+ F</td></tr>
36 | <tr>
37 | <td>− 0</td>
38 | <td>+ 0</td></tr>
39 | <tr>
40 | <td>+ 0</td>
41 | <td>+ 0</td></tr>
42 | <tr>
43 | <td>+ F</td>
44 | <td>+ F</td></tr>
45 | <tr>
46 | <td>+ ∞</td>
47 | <td>+ ∞</td></tr>
48 | <tr>
49 | <td>NaN</td>
50 | <td>NaN</td></tr></table>
51 | <p><strong>NOTES:</strong></p>
52 | <p>F means finite floating-point value.</p>
53 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
54 | <h2>Operation</h2>
55 | <pre>ST(0) ← |ST(0)|;</pre>
56 | <h2>FPU Flags Affected</h2>
57 | <table class="exception-table">
58 | <tr>
59 | <td>C1</td>
60 | <td>Set to 0.</td></tr>
61 | <tr>
62 | <td>C0, C2, C3</td>
63 | <td>Undefined.</td></tr></table>
64 | <h2>Floating-Point Exceptions</h2>
65 | <table class="exception-table">
66 | <tr>
67 | <td>#IS</td>
68 | <td>Stack underflow occurred.</td></tr></table>
69 | <h2>Protected Mode Exceptions</h2>
70 | <table class="exception-table">
71 | <tr>
72 | <td>#NM</td>
73 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
74 | <tr>
75 | <td>#UD</td>
76 | <td>If the LOCK prefix is used.</td></tr></table>
77 | <h2>Real-Address Mode Exceptions</h2>
78 | <p>Same exceptions as in protected mode.</p>
79 | <h2>Virtual-8086 Mode Exceptions</h2>
80 | <p>Same exceptions as in protected mode.</p>
81 | <h2>Compatibility Mode Exceptions</h2>
82 | <p>Same exceptions as in protected mode.</p>
83 | <h2>64-Bit Mode Exceptions</h2>
84 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FCHS.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FCHS—Change Sign </title></head>
 8 | <body>
 9 | <h1>FCHS—Change Sign</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 E0</td>
19 | <td>FCHS</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Complements sign of ST(0).</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Complements the sign bit of ST(0). This operation changes a positive value into a negative value of equal magnitude or vice versa. The following table shows the results obtained when changing the sign of various classes of numbers.</p>
25 | <h3>Table 3-20.  FCHS Results</h3>
26 | <table>
27 | <tr>
28 | <th>ST(0) SRC</th>
29 | <th>ST(0) DEST</th></tr>
30 | <tr>
31 | <td>− ∞</td>
32 | <td>+ ∞</td></tr>
33 | <tr>
34 | <td>− F</td>
35 | <td>+ F</td></tr>
36 | <tr>
37 | <td>− 0</td>
38 | <td>+ 0</td></tr>
39 | <tr>
40 | <td>+ 0</td>
41 | <td>− 0</td></tr>
42 | <tr>
43 | <td>+ F</td>
44 | <td>− F</td></tr>
45 | <tr>
46 | <td>+ ∞</td>
47 | <td>− ∞</td></tr>
48 | <tr>
49 | <td>NaN</td>
50 | <td>NaN</td></tr></table>
51 | <p><strong>NOTES:</strong></p>
52 | <p>*</p>
53 | <p>F means finite floating-point value.</p>
54 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
55 | <h2>Operation</h2>
56 | <pre>SignBit(ST(0)) ← NOT (SignBit(ST(0)));</pre>
57 | <h2>FPU Flags Affected</h2>
58 | <table class="exception-table">
59 | <tr>
60 | <td>C1</td>
61 | <td>Set to 0.</td></tr>
62 | <tr>
63 | <td>C0, C2, C3</td>
64 | <td>Undefined.</td></tr></table>
65 | <h2>Floating-Point Exceptions</h2>
66 | <table class="exception-table">
67 | <tr>
68 | <td>#IS</td>
69 | <td>Stack underflow occurred.</td></tr></table>
70 | <h2>Protected Mode Exceptions</h2>
71 | <table class="exception-table">
72 | <tr>
73 | <td>#NM</td>
74 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
75 | <tr>
76 | <td>#UD</td>
77 | <td>If the LOCK prefix is used.</td></tr></table>
78 | <h2>Real-Address Mode Exceptions</h2>
79 | <p>Same exceptions as in protected mode.</p>
80 | <h2>Virtual-8086 Mode Exceptions</h2>
81 | <p>Same exceptions as in protected mode.</p>
82 | <h2>Compatibility Mode Exceptions</h2>
83 | <p>Same exceptions as in protected mode.</p>
84 | <h2>64-Bit Mode Exceptions</h2>
85 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FDECSTP.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FDECSTP—Decrement Stack-Top Pointer </title></head>
 8 | <body>
 9 | <h1>FDECSTP—Decrement Stack-Top Pointer</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 F6</td>
19 | <td>FDECSTP</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Decrement TOP field in FPU status word.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Subtracts one from the TOP field of the FPU status word (decrements the top-of-stack pointer). If the TOP field contains a 0, it is set to 7. The effect of this instruction is to rotate the stack by one position. The contents of the FPU data registers and tag register are not affected.</p>
25 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
26 | <h2>Operation</h2>
27 | <pre>IF TOP = 0
28 |     THEN TOP ← 7;
29 |     ELSE TOP ← TOP – 1;
30 | FI;</pre>
31 | <h2>FPU Flags Affected</h2>
32 | <p>The C1 flag is set to 0. The C0, C2, and C3 flags are undefined.</p>
33 | <h2>Floating-Point Exceptions</h2>
34 | <p>None.</p>
35 | <h2>Protected Mode Exceptions</h2>
36 | <table class="exception-table">
37 | <tr>
38 | <td>#NM</td>
39 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
40 | <tr>
41 | <td>#MF</td>
42 | <td>If there is a pending x87 FPU exception.</td></tr>
43 | <tr>
44 | <td>#UD</td>
45 | <td>If the LOCK prefix is used.</td></tr></table>
46 | <h2>Real-Address Mode Exceptions</h2>
47 | <p>Same exceptions as in protected mode.</p>
48 | <h2>Virtual-8086 Mode Exceptions</h2>
49 | <p>Same exceptions as in protected mode.</p>
50 | <h2>Compatibility Mode Exceptions</h2>
51 | <p>Same exceptions as in protected mode.</p>
52 | <h2>64-Bit Mode Exceptions</h2>
53 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FFREE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FFREE—Free Floating-Point Register </title></head>
 8 | <body>
 9 | <h1>FFREE—Free Floating-Point Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>DD C0+i</td>
19 | <td>FFREE ST(i)</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Sets tag for ST(i) to empty.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Sets the tag in the FPU tag register associated with register ST(i) to empty (11B). The contents of ST(i) and the FPU stack-top pointer (TOP) are not affected.</p>
25 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
26 | <h2>Operation</h2>
27 | <pre>TAG(i) ← 11B;</pre>
28 | <h2>FPU Flags Affected</h2>
29 | <p>C0, C1, C2, C3 undefined.</p>
30 | <h2>Floating-Point Exceptions</h2>
31 | <p>None</p>
32 | <h2>Protected Mode Exceptions</h2>
33 | <table class="exception-table">
34 | <tr>
35 | <td>#NM</td>
36 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
37 | <tr>
38 | <td>#MF</td>
39 | <td>If there is a pending x87 FPU exception.</td></tr>
40 | <tr>
41 | <td>#UD</td>
42 | <td>If the LOCK prefix is used.</td></tr></table>
43 | <h2>Real-Address Mode Exceptions</h2>
44 | <p>Same exceptions as in protected mode.</p>
45 | <h2>Virtual-8086 Mode Exceptions</h2>
46 | <p>Same exceptions as in protected mode.</p>
47 | <h2>Compatibility Mode Exceptions</h2>
48 | <p>Same exceptions as in protected mode.</p>
49 | <h2>64-Bit Mode Exceptions</h2>
50 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FINCSTP.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FINCSTP—Increment Stack-Top Pointer </title></head>
 8 | <body>
 9 | <h1>FINCSTP—Increment Stack-Top Pointer</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 F7</td>
19 | <td>FINCSTP</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Increment the TOP field in the FPU status register.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Adds one to the TOP field of the FPU status word (increments the top-of-stack pointer). If the TOP field contains a 7, it is set to 0. The effect of this instruction is to rotate the stack by one position. The contents of the FPU data registers and tag register are not affected. This operation is not equivalent to popping the stack, because the tag for the previous top-of-stack register is not marked empty.</p>
25 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
26 | <h2>Operation</h2>
27 | <pre>IF TOP = 7
28 |     THEN TOP ← 0;
29 |     ELSE TOP ← TOP + 1;
30 | FI;</pre>
31 | <h2>FPU Flags Affected</h2>
32 | <p>The C1 flag is set to 0. The C0, C2, and C3 flags are undefined.</p>
33 | <h2>Floating-Point Exceptions</h2>
34 | <p>None</p>
35 | <h2>Protected Mode Exceptions</h2>
36 | <table class="exception-table">
37 | <tr>
38 | <td>#NM</td>
39 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
40 | <tr>
41 | <td>#MF</td>
42 | <td>If there is a pending x87 FPU exception.</td></tr>
43 | <tr>
44 | <td>#UD</td>
45 | <td>If the LOCK prefix is used.</td></tr></table>
46 | <h2>Real-Address Mode Exceptions</h2>
47 | <p>Same exceptions as in protected mode.</p>
48 | <h2>Virtual-8086 Mode Exceptions</h2>
49 | <p>Same exceptions as in protected mode.</p>
50 | <h2>Compatibility Mode Exceptions</h2>
51 | <p>Same exceptions as in protected mode.</p>
52 | <h2>64-Bit Mode Exceptions</h2>
53 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FNOP.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FNOP—No Operation </title></head>
 8 | <body>
 9 | <h1>FNOP—No Operation</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 D0</td>
19 | <td>FNOP</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>No operation is performed.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Performs no FPU operation. This instruction takes up space in the instruction stream but does not affect the FPU or machine context, except the EIP register and the FPU Instruction Pointer.</p>
25 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
26 | <h2>FPU Flags Affected</h2>
27 | <p>C0, C1, C2, C3 undefined.</p>
28 | <h2>Floating-Point Exceptions</h2>
29 | <p>None</p>
30 | <h2>Protected Mode Exceptions</h2>
31 | <table class="exception-table">
32 | <tr>
33 | <td>#NM</td>
34 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
35 | <tr>
36 | <td>#MF</td>
37 | <td>If there is a pending x87 FPU exception.</td></tr>
38 | <tr>
39 | <td>#UD</td>
40 | <td>If the LOCK prefix is used.</td></tr></table>
41 | <h2>Real-Address Mode Exceptions</h2>
42 | <p>Same exceptions as in protected mode.</p>
43 | <h2>Virtual-8086 Mode Exceptions</h2>
44 | <p>Same exceptions as in protected mode.</p>
45 | <h2>Compatibility Mode Exceptions</h2>
46 | <p>Same exceptions as in protected mode.</p>
47 | <h2>64-Bit Mode Exceptions</h2>
48 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FRNDINT.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FRNDINT—Round to Integer </title></head>
 8 | <body>
 9 | <h1>FRNDINT—Round to Integer</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 FC</td>
19 | <td>FRNDINT</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Round ST(0) to an integer.</td></tr></table>
23 | <h2>Description</h2>
24 | <p>Rounds the source value in the ST(0) register to the nearest integral value, depending on the current rounding mode (setting of the RC field of the FPU control word), and stores the result in ST(0).</p>
25 | <p>If the source value is ∞, the value is not changed. If the source value is not an integral value, the floating-point inexact-result exception (#P) is generated.</p>
26 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
27 | <h2>Operation</h2>
28 | <pre>ST(0) ← RoundToIntegralValue(ST(0));</pre>
29 | <h2>FPU Flags Affected</h2>
30 | <table class="exception-table">
31 | <tr>
32 | <td>C1</td>
33 | <td>
34 | <p>Set to 0 if stack underflow occurred.</p>
35 | <p>Set if result was rounded up; cleared otherwise.</p></td></tr>
36 | <tr>
37 | <td>C0, C2, C3</td>
38 | <td>Undefined.</td></tr></table>
39 | <h2>Floating-Point Exceptions</h2>
40 | <table class="exception-table">
41 | <tr>
42 | <td>#IS</td>
43 | <td>Stack underflow occurred.</td></tr>
44 | <tr>
45 | <td>#IA</td>
46 | <td>Source operand is an SNaN value or unsupported format.</td></tr>
47 | <tr><td>#D</td>
48 | <td>Source operand is a denormal value.</td></tr>
49 | <tr><td>#P</td>
50 | <td>Source operand is not an integral value.</td></tr></table>
51 | <h2>Protected Mode Exceptions</h2>
52 | <table class="exception-table">
53 | <tr>
54 | <td>#NM</td>
55 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
56 | <tr>
57 | <td>#MF</td>
58 | <td>If there is a pending x87 FPU exception.</td></tr>
59 | <tr>
60 | <td>#UD</td>
61 | <td>If the LOCK prefix is used.</td></tr></table>
62 | <h2>Real-Address Mode Exceptions</h2>
63 | <p>Same exceptions as in protected mode.</p>
64 | <h2>Virtual-8086 Mode Exceptions</h2>
65 | <p>Same exceptions as in protected mode.</p>
66 | <h2>Compatibility Mode Exceptions</h2>
67 | <p>Same exceptions as in protected mode.</p>
68 | <h2>64-Bit Mode Exceptions</h2>
69 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FSQRT.html:
--------------------------------------------------------------------------------
  1 | <!DOCTYPE html>
  2 | 
  3 | <html>
  4 | <head>
  5 | <meta charset="UTF-8">
  6 | <link href="style.css" type="text/css" rel="stylesheet">
  7 | <title>FSQRT—Square Root </title></head>
  8 | <body>
  9 | <h1>FSQRT—Square Root</h1>
 10 | <table>
 11 | <tr>
 12 | <th>Opcode</th>
 13 | <th>Instruction</th>
 14 | <th>64-Bit Mode</th>
 15 | <th>Compat/Leg Mode</th>
 16 | <th>Description</th></tr>
 17 | <tr>
 18 | <td>D9 FA</td>
 19 | <td>FSQRT</td>
 20 | <td>Valid</td>
 21 | <td>Valid</td>
 22 | <td>Computes square root of ST(0) and stores the result in ST(0).</td></tr></table>
 23 | <h2>Description</h2>
 24 | <p>Computes the square root of the source value in the ST(0) register and stores the result in ST(0).</p>
 25 | <p>The following table shows the results obtained when taking the square root of various classes of numbers, assuming that neither overflow nor underflow occurs.</p>
 26 | <h3>Table 3-37.  FSQRT Results</h3>
 27 | <table>
 28 | <tr>
 29 | <th>SRC (ST(0))</th>
 30 | <th>DEST (ST(0))</th></tr>
 31 | <tr>
 32 | <td>− ∞</td>
 33 | <td>*</td></tr>
 34 | <tr>
 35 | <td>− F</td>
 36 | <td>*</td></tr>
 37 | <tr>
 38 | <td>− 0</td>
 39 | <td>− 0</td></tr>
 40 | <tr>
 41 | <td>+ 0</td>
 42 | <td>+ 0</td></tr>
 43 | <tr>
 44 | <td>+ F</td>
 45 | <td>+ F</td></tr>
 46 | <tr>
 47 | <td>+ ∞</td>
 48 | <td>+ ∞</td></tr>
 49 | <tr>
 50 | <td>NaN</td>
 51 | <td>NaN</td></tr></table>
 52 | <p><strong>NOTES:</strong></p>
  53 | <p>F means finite floating-point value.</p>
  54 | <p>*
  55 | Indicates floating-point invalid-arithmetic-operand (#IA) exception.</p>
 56 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
 57 | <h2>Operation</h2>
 58 | <pre>ST(0) ← SquareRoot(ST(0));</pre>
 59 | <h2>FPU Flags Affected</h2>
 60 | <table class="exception-table">
 61 | <tr>
 62 | <td>C1</td>
 63 | <td>
 64 | <p>Set to 0 if stack underflow occurred.</p>
 65 | <p>Set if result was rounded up; cleared otherwise.</p></td></tr>
 66 | <tr>
 67 | <td>C0, C2, C3</td>
 68 | <td>Undefined.</td></tr></table>
 69 | <h2>Floating-Point Exceptions</h2>
 70 | <table class="exception-table">
 71 | <tr>
 72 | <td>#IS</td>
 73 | <td>Stack underflow occurred.</td></tr>
 74 | <tr>
 75 | <td>#IA</td>
 76 | <td>
 77 | <p>Source operand is an SNaN value or unsupported format.</p>
  78 | <p>Source operand is a negative value (except for −0).</p></td></tr>
  79 | <tr><td>#D</td>
  80 | <td>Source operand is a denormal value.</td></tr>
  81 | <tr><td>#P</td>
  82 | <td>Value cannot be represented exactly in destination format.</td></tr></table>
 83 | <h2>Protected Mode Exceptions</h2>
 84 | <table class="exception-table">
 85 | <tr>
 86 | <td>#NM</td>
 87 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
 88 | <tr>
 89 | <td>#MF</td>
 90 | <td>If there is a pending x87 FPU exception.</td></tr>
 91 | <tr>
 92 | <td>#UD</td>
 93 | <td>If the LOCK prefix is used.</td></tr></table>
 94 | <h2>Real-Address Mode Exceptions</h2>
 95 | <p>Same exceptions as in protected mode.</p>
 96 | <h2>Virtual-8086 Mode Exceptions</h2>
 97 | <p>Same exceptions as in protected mode.</p>
 98 | <h2>Compatibility Mode Exceptions</h2>
 99 | <p>Same exceptions as in protected mode.</p>
100 | <h2>64-Bit Mode Exceptions</h2>
101 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FXAM.html:
--------------------------------------------------------------------------------
  1 | <!DOCTYPE html>
  2 | 
  3 | <html>
  4 | <head>
  5 | <meta charset="UTF-8">
  6 | <link href="style.css" type="text/css" rel="stylesheet">
  7 | <title>FXAM—Examine Floating-Point </title></head>
  8 | <body>
  9 | <h1>FXAM—Examine Floating-Point</h1>
 10 | <table>
 11 | <tr>
 12 | <th>Opcode</th>
 13 | <th>Instruction</th>
 14 | <th>64-Bit Mode</th>
 15 | <th>Compat/Leg Mode</th>
 16 | <th>Description</th></tr>
 17 | <tr>
 18 | <td>D9 E5</td>
 19 | <td>FXAM</td>
 20 | <td>Valid</td>
 21 | <td>Valid</td>
 22 | <td>Classify value or number in ST(0).</td></tr></table>
 23 | <h2>Description</h2>
 24 | <p>Examines the contents of the ST(0) register and sets the condition code flags C0, C2, and C3 in the FPU status word to indicate the class of value or number in the register (see the table below).</p>
 25 | <h3>Table 3-42.  FXAM Results</h3>
 26 | <p>.</p>
 27 | <table>
 28 | <tr>
 29 | <th>Class</th>
 30 | <th>C3</th>
 31 | <th>C2</th>
 32 | <th>C0</th></tr>
 33 | <tr>
 34 | <td>Unsupported</td>
 35 | <td>0</td>
 36 | <td>0</td>
 37 | <td>0</td></tr>
 38 | <tr>
 39 | <td>NaN</td>
 40 | <td>0</td>
 41 | <td>0</td>
 42 | <td>1</td></tr>
 43 | <tr>
 44 | <td>Normal finite number</td>
 45 | <td>0</td>
 46 | <td>1</td>
 47 | <td>0</td></tr>
 48 | <tr>
 49 | <td>Infinity</td>
 50 | <td>0</td>
 51 | <td>1</td>
 52 | <td>1</td></tr>
 53 | <tr>
 54 | <td>Zero</td>
 55 | <td>1</td>
 56 | <td>0</td>
 57 | <td>0</td></tr>
 58 | <tr>
 59 | <td>Empty</td>
 60 | <td>1</td>
 61 | <td>0</td>
 62 | <td>1</td></tr>
 63 | <tr>
 64 | <td>Denormal number</td>
 65 | <td>1</td>
 66 | <td>1</td>
 67 | <td>0</td></tr></table>
 68 | <p>The C1 flag is set to the sign of the value in ST(0), regardless of whether the register is empty or full.</p>
 69 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
 70 | <h2>Operation</h2>
 71 | <pre>C1 ← sign bit of ST; (* 0 for positive, 1 for negative *)
 72 | CASE (class of value or number in ST(0)) OF
  73 |     Unsupported: C3, C2, C0 ← 000;
 74 |     NaN:
 75 |                     C3, C2, C0 ← 001;
 76 |     Normal:
 77 |                     C3, C2, C0 ← 010;
 78 |     Infinity:
 79 |                     C3, C2, C0 ← 011;
 80 |     Zero:
 81 |                     C3, C2, C0 ← 100;
 82 |     Empty:
 83 |                     C3, C2, C0 ← 101;
 84 |     Denormal:
 85 |                     C3, C2, C0 ← 110;
 86 | ESAC;</pre>
 87 | <h2>FPU Flags Affected</h2>
 88 | <table class="exception-table">
 89 | <tr>
 90 | <td>C1</td>
 91 | <td>Sign of value in ST(0).</td></tr>
 92 | <tr>
 93 | <td>C0, C2, C3</td>
 94 | <td>See Table 3-42.</td></tr></table>
 95 | <h2>Floating-Point Exceptions</h2>
 96 | <p>None</p>
 97 | <h2>Protected Mode Exceptions</h2>
 98 | <table class="exception-table">
 99 | <tr>
100 | <td>#NM</td>
101 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
102 | <tr>
103 | <td>#MF</td>
104 | <td>If there is a pending x87 FPU exception.</td></tr>
105 | <tr>
106 | <td>#UD</td>
107 | <td>If the LOCK prefix is used.</td></tr></table>
108 | <h2>Real-Address Mode Exceptions</h2>
109 | <p>Same exceptions as in protected mode.</p>
110 | <h2>Virtual-8086 Mode Exceptions</h2>
111 | <p>Same exceptions as in protected mode.</p>
112 | <h2>Compatibility Mode Exceptions</h2>
113 | <p>Same exceptions as in protected mode.</p>
114 | <h2>64-Bit Mode Exceptions</h2>
115 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/FXCH.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>FXCH—Exchange Register Contents </title></head>
 8 | <body>
 9 | <h1>FXCH—Exchange Register Contents</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>D9 C8+i</td>
19 | <td>FXCH ST(i)</td>
20 | <td>Valid</td>
21 | <td>Valid</td>
22 | <td>Exchange the contents of ST(0) and ST(i).</td></tr>
23 | <tr>
24 | <td>D9 C9</td>
25 | <td>FXCH</td>
26 | <td>Valid</td>
27 | <td>Valid</td>
28 | <td>Exchange the contents of ST(0) and ST(1).</td></tr></table>
29 | <h2>Description</h2>
30 | <p>Exchanges the contents of registers ST(0) and ST(i). If no source operand is specified, the contents of ST(0) and ST(1) are exchanged.</p>
31 | <p>This instruction provides a simple means of moving values in the FPU register stack to the top of the stack [ST(0)], so that they can be operated on by those floating-point instructions that can only operate on values in ST(0). For example, the following instruction sequence takes the square root of the third register from the top of the register stack:</p>
32 | <p>FXCH ST(3);</p>
33 | <p>FSQRT;</p>
34 | <p>FXCH ST(3);</p>
35 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
36 | <h2>Operation</h2>
37 | <pre>IF (Number-of-operands) is 1
38 |     THEN
39 |          temp ← ST(0);
40 |          ST(0) ← SRC;
41 |          SRC ← temp;
42 |     ELSE
43 |          temp ← ST(0);
44 |          ST(0) ← ST(1);
45 |          ST(1) ← temp;
46 | FI;</pre>
47 | <h2>FPU Flags Affected</h2>
48 | <table class="exception-table">
49 | <tr>
50 | <td>C1</td>
51 | <td>Set to 0.</td></tr>
52 | <tr>
53 | <td>C0, C2, C3</td>
54 | <td>Undefined.</td></tr></table>
55 | <h2>Floating-Point Exceptions</h2>
56 | <table class="exception-table">
57 | <tr>
58 | <td>#IS</td>
59 | <td>Stack underflow occurred.</td></tr></table>
60 | <h2>Protected Mode Exceptions</h2>
61 | <table class="exception-table">
62 | <tr>
63 | <td>#NM</td>
64 | <td>CR0.EM[bit 2] or CR0.TS[bit 3] = 1.</td></tr>
65 | <tr>
66 | <td>#MF</td>
67 | <td>If there is a pending x87 FPU exception.</td></tr>
68 | <tr>
69 | <td>#UD</td>
70 | <td>If the LOCK prefix is used.</td></tr></table>
71 | <h2>Real-Address Mode Exceptions</h2>
72 | <p>Same exceptions as in protected mode.</p>
73 | <h2>Virtual-8086 Mode Exceptions</h2>
74 | <p>Same exceptions as in protected mode.</p>
75 | <h2>Compatibility Mode Exceptions</h2>
76 | <p>Same exceptions as in protected mode.</p>
77 | <h2>64-Bit Mode Exceptions</h2>
78 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/HLT.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>HLT—Halt </title></head>
 8 | <body>
 9 | <h1>HLT—Halt</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F4</td>
20 | <td>HLT</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Halt</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Stops instruction execution and places the processor in a HALT state. An enabled interrupt (including NMI and SMI), a debug exception, the BINIT# signal, the INIT# signal, or the RESET# signal will resume execution. If an interrupt (including NMI) is used to resume execution after a HLT instruction, the saved instruction pointer (CS:EIP) points to the instruction following the HLT instruction.</p>
41 | <p>When a HLT instruction is executed on an Intel 64 or IA-32 processor supporting Intel Hyper-Threading Technology, only the logical processor that executes the instruction is halted. The other logical processors in the physical processor remain active, unless they are each individually halted by executing a HLT instruction.</p>
42 | <p>The HLT instruction is a privileged instruction. When the processor is running in protected or virtual-8086 mode, the privilege level of a program or procedure must be 0 to execute the HLT instruction.</p>
43 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
44 | <h2>Operation</h2>
45 | <pre>Enter Halt state;</pre>
46 | <h2>Flags Affected</h2>
47 | <p>None</p>
48 | <h2>Protected Mode Exceptions</h2>
49 | <table class="exception-table">
50 | <tr>
51 | <td>#GP(0)</td>
52 | <td>If the current privilege level is not 0.</td></tr>
53 | <tr>
54 | <td>#UD</td>
55 | <td>If the LOCK prefix is used.</td></tr></table>
56 | <h2>Real-Address Mode Exceptions</h2>
57 | <p>None.</p>
58 | <h2>Virtual-8086 Mode Exceptions</h2>
59 | <p>Same exceptions as in protected mode.</p>
60 | <h2>Compatibility Mode Exceptions</h2>
61 | <p>Same exceptions as in protected mode.</p>
62 | <h2>64-Bit Mode Exceptions</h2>
63 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/KADDW_KADDB_KADDQ_KADDD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KADDW/KADDB/KADDQ/KADDD—ADD Two Masks </title></head>
 8 | <body>
 9 | <h1>KADDW/KADDB/KADDQ/KADDD—ADD Two Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.L1.0F.W0 4A /r KADDW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512DQ</td>
22 | <td>Add 16 bits masks in k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 4A /r KADDB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Add 8 bits masks in k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 4A /r KADDQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Add 64 bits masks in k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 4A /r KADDD k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Add 32 bits masks in k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table><tr><td>Op/En</td>
43 | <td>Operand 1</td>
44 | <td>Operand 2</td>
45 | <td>Operand 3</td></tr>
46 | <tr><td>RVR</td>
47 | <td>ModRM:reg (w)</td>
48 | <td>VEX.1vvv (r)</td>
49 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
50 | <h2>Description</h2>
51 | <p>Adds the vector mask k2 and the vector mask k3, and writes the result into vector mask k1.</p>
52 | <h2>Operation</h2>
53 | <p><strong>KADDW</strong></p>
54 | <pre>DEST[15:0] ← SRC1[15:0] + SRC2[15:0]
55 | DEST[MAX_KL-1:16] ← 0</pre>
56 | <p><strong>KADDB</strong></p>
57 | <pre>DEST[7:0] ← SRC1[7:0] + SRC2[7:0]
58 | DEST[MAX_KL-1:8] ← 0</pre>
59 | <p><strong>KADDQ</strong></p>
60 | <pre>DEST[63:0] ← SRC1[63:0] + SRC2[63:0]
61 | DEST[MAX_KL-1:64] ← 0</pre>
62 | <p><strong>KADDD</strong></p>
63 | <pre>DEST[31:0] ← SRC1[31:0] + SRC2[31:0]
64 | DEST[MAX_KL-1:32] ← 0</pre>
65 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
66 | <h2>SIMD Floating-Point Exceptions</h2>
67 | <p>None</p>
68 | <h2>Other Exceptions</h2>
69 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KANDNW_KANDNB_KANDNQ_KANDND.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KANDNW/KANDNB/KANDNQ/KANDND—Bitwise Logical AND NOT Masks </title></head>
 8 | <body>
 9 | <h1>KANDNW/KANDNB/KANDNQ/KANDND—Bitwise Logical AND NOT Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.0F.W0 42 /r KANDNW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise AND NOT 16 bits masks k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 42 /r KANDNB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise AND NOT 8 bits masks k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 42 /r KANDNQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise AND NOT 64 bits masks k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 42 /r KANDND k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise AND NOT 32 bits masks k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RVR</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>VEX.1vvv (r)</td>
52 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Performs a bitwise AND NOT between the vector mask k2 and the vector mask k3, and writes the result into vector mask k1.</p>
55 | <h2>Operation</h2>
56 | <p><strong>KANDNW</strong></p>
57 | <pre>DEST[15:0] ← (BITWISE NOT SRC1[15:0]) BITWISE AND SRC2[15:0]
58 | DEST[MAX_KL-1:16] ← 0</pre>
59 | <p><strong>KANDNB</strong></p>
60 | <pre>DEST[7:0] ← (BITWISE NOT SRC1[7:0]) BITWISE AND SRC2[7:0]
61 | DEST[MAX_KL-1:8] ← 0</pre>
62 | <p><strong>KANDNQ</strong></p>
63 | <pre>DEST[63:0] ← (BITWISE NOT SRC1[63:0]) BITWISE AND SRC2[63:0]
64 | DEST[MAX_KL-1:64] ← 0</pre>
65 | <p><strong>KANDND</strong></p>
66 | <pre>DEST[31:0] ← (BITWISE NOT SRC1[31:0]) BITWISE AND SRC2[31:0]
67 | DEST[MAX_KL-1:32] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>KANDNW __mmask16 _mm512_kandn(__mmask16 a, __mmask16 b);</p>
70 | <h2>Flags Affected</h2>
71 | <p>None</p>
72 | <h2>SIMD Floating-Point Exceptions</h2>
73 | <p>None</p>
74 | <h2>Other Exceptions</h2>
75 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KANDW_KANDB_KANDQ_KANDD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KANDW/KANDB/KANDQ/KANDD—Bitwise Logical AND Masks </title></head>
 8 | <body>
 9 | <h1>KANDW/KANDB/KANDQ/KANDD—Bitwise Logical AND Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.0F.W0 41 /r KANDW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise AND 16 bits masks k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 41 /r KANDB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise AND 8 bits masks k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 41 /r KANDQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise AND 64 bits masks k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 41 /r KANDD k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise AND 32 bits masks k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RVR</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>VEX.1vvv (r)</td>
52 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Performs a bitwise AND between the vector mask k2 and the vector mask k3, and writes the result into vector mask k1.</p>
55 | <h2>Operation</h2>
56 | <p><strong>KANDW</strong></p>
57 | <pre>DEST[15:0] ← SRC1[15:0] BITWISE AND SRC2[15:0]
58 | DEST[MAX_KL-1:16] ← 0</pre>
59 | <p><strong>KANDB</strong></p>
60 | <pre>DEST[7:0] ← SRC1[7:0] BITWISE AND SRC2[7:0]
61 | DEST[MAX_KL-1:8] ← 0</pre>
62 | <p><strong>KANDQ</strong></p>
63 | <pre>DEST[63:0] ← SRC1[63:0] BITWISE AND SRC2[63:0]
64 | DEST[MAX_KL-1:64] ← 0</pre>
65 | <p><strong>KANDD</strong></p>
66 | <pre>DEST[31:0] ← SRC1[31:0] BITWISE AND SRC2[31:0]
67 | DEST[MAX_KL-1:32] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>KANDW __mmask16 _mm512_kand(__mmask16 a, __mmask16 b);</p>
70 | <h2>Flags Affected</h2>
71 | <p>None</p>
72 | <h2>SIMD Floating-Point Exceptions</h2>
73 | <p>None</p>
74 | <h2>Other Exceptions</h2>
75 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KNOTW_KNOTB_KNOTQ_KNOTD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KNOTW/KNOTB/KNOTQ/KNOTD—NOT Mask Register </title></head>
 8 | <body>
 9 | <h1>KNOTW/KNOTB/KNOTQ/KNOTD—NOT Mask Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.L0.0F.W0 44 /r KNOTW k1, k2</td>
19 | <td>RR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise NOT of 16 bits mask k2.</td></tr>
23 | <tr>
24 | <td>VEX.L0.66.0F.W0 44 /r KNOTB k1, k2</td>
25 | <td>RR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise NOT of 8 bits mask k2.</td></tr>
29 | <tr>
30 | <td>VEX.L0.0F.W1 44 /r KNOTQ k1, k2</td>
31 | <td>RR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise NOT of 64 bits mask k2.</td></tr>
35 | <tr>
36 | <td>VEX.L0.66.0F.W1 44 /r KNOTD k1, k2</td>
37 | <td>RR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise NOT of 32 bits mask k2.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td></tr>
47 | <tr>
48 | <td>RR</td>
49 | <td>ModRM:reg (w)</td>
50 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
51 | <h2>Description</h2>
52 | <p>Performs a bitwise NOT of vector mask k2 and writes the result into vector mask k1.</p>
53 | <h2>Operation</h2>
54 | <p><strong>KNOTW</strong></p>
55 | <pre>DEST[15:0] ← BITWISE NOT SRC[15:0]
56 | DEST[MAX_KL-1:16] ← 0</pre>
57 | <p><strong>KNOTB</strong></p>
58 | <pre>DEST[7:0] ← BITWISE NOT SRC[7:0]
59 | DEST[MAX_KL-1:8] ← 0</pre>
60 | <p><strong>KNOTQ</strong></p>
61 | <pre>DEST[63:0] ← BITWISE NOT SRC[63:0]
62 | DEST[MAX_KL-1:64] ← 0</pre>
63 | <p><strong>KNOTD</strong></p>
64 | <pre>DEST[31:0] ← BITWISE NOT SRC[31:0]
65 | DEST[MAX_KL-1:32] ← 0</pre>
66 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
67 | <p>KNOTW __mmask16 _mm512_knot(__mmask16 a);</p>
68 | <h2>Flags Affected</h2>
69 | <p>None</p>
70 | <h2>SIMD Floating-Point Exceptions</h2>
71 | <p>None</p>
72 | <h2>Other Exceptions</h2>
73 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KORW_KORB_KORQ_KORD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KORW/KORB/KORQ/KORD—Bitwise Logical OR Masks </title></head>
 8 | <body>
 9 | <h1>KORW/KORB/KORQ/KORD—Bitwise Logical OR Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.0F.W0 45 /r KORW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise OR 16 bits masks k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 45 /r KORB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise OR 8 bits masks k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 45 /r KORQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise OR 64 bits masks k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 45 /r KORD k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise OR 32 bits masks k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RVR</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>VEX.1vvv (r)</td>
52 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Performs a bitwise OR between the vector mask k2 and the vector mask k3, and writes the result into vector mask k1 (three-operand form).</p>
55 | <h2>Operation</h2>
56 | <p><strong>KORW</strong></p>
57 | <pre>DEST[15:0] ← SRC1[15:0] BITWISE OR SRC2[15:0]
58 | DEST[MAX_KL-1:16] ← 0</pre>
59 | <p><strong>KORB</strong></p>
60 | <pre>DEST[7:0] ← SRC1[7:0] BITWISE OR SRC2[7:0]
61 | DEST[MAX_KL-1:8] ← 0</pre>
62 | <p><strong>KORQ</strong></p>
63 | <pre>DEST[63:0] ← SRC1[63:0] BITWISE OR SRC2[63:0]
64 | DEST[MAX_KL-1:64] ← 0</pre>
65 | <p><strong>KORD</strong></p>
66 | <pre>DEST[31:0] ← SRC1[31:0] BITWISE OR SRC2[31:0]
67 | DEST[MAX_KL-1:32] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>KORW __mmask16 _mm512_kor(__mmask16 a, __mmask16 b);</p>
70 | <h2>Flags Affected</h2>
71 | <p>None</p>
72 | <h2>SIMD Floating-Point Exceptions</h2>
73 | <p>None</p>
74 | <h2>Other Exceptions</h2>
75 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KSHIFTLW_KSHIFTLB_KSHIFTLQ_KSHIFTLD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KSHIFTLW/KSHIFTLB/KSHIFTLQ/KSHIFTLD—Shift Left Mask Registers </title></head>
 8 | <body>
 9 | <h1>KSHIFTLW/KSHIFTLB/KSHIFTLQ/KSHIFTLD—Shift Left Mask Registers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.L0.66.0F3A.W1 32 /r KSHIFTLW k1, k2, imm8</td>
19 | <td>RRI</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Shift left 16 bits in k2 by immediate and write result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L0.66.0F3A.W0 32 /r KSHIFTLB k1, k2, imm8</td>
25 | <td>RRI</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Shift left 8 bits in k2 by immediate and write result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L0.66.0F3A.W1 33 /r KSHIFTLQ k1, k2, imm8</td>
31 | <td>RRI</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Shift left 64 bits in k2 by immediate and write result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L0.66.0F3A.W0 33 /r KSHIFTLD k1, k2, imm8</td>
37 | <td>RRI</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Shift left 32 bits in k2 by immediate and write result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RRI</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td>
52 | <td>Imm8</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Shifts 8/16/32/64 bits in the second operand (source operand) left by the count specified in the immediate byte and places the least significant 8/16/32/64 bits of the result in the destination operand. The higher bits of the destination are zero-extended. The destination is set to zero if the count value is greater than 7 (for byte shift), 15 (for word shift), 31 (for doubleword shift) or 63 (for quadword shift).</p>
55 | <h2>Operation</h2>
56 | <p><strong>KSHIFTLW</strong></p>
57 | <pre>COUNT ← imm8[7:0]
58 | DEST[MAX_KL-1:0] ← 0
59 | IF COUNT &lt;=15
60 |     THEN DEST[15:0] ← SRC1[15:0] &lt;&lt; COUNT;
61 | FI;</pre>
62 | <p><strong>KSHIFTLB</strong></p>
63 | <pre>COUNT ← imm8[7:0]
64 | DEST[MAX_KL-1:0] ← 0
65 | IF COUNT &lt;=7
66 |           THEN
67 |                      DEST[7:0] ← SRC1[7:0] &lt;&lt; COUNT;
68 | FI;</pre>
69 | <p><strong>KSHIFTLQ</strong></p>
70 | <pre>COUNT ← imm8[7:0]
71 | DEST[MAX_KL-1:0] ← 0
72 | IF COUNT &lt;=63
73 |           THEN
74 |                      DEST[63:0] ← SRC1[63:0] &lt;&lt; COUNT;
75 | FI;</pre>
76 | <p><strong>KSHIFTLD</strong></p>
77 | <pre>COUNT ← imm8[7:0]
78 | DEST[MAX_KL-1:0] ← 0
79 | IF COUNT &lt;=31
80 |           THEN
81 |                      DEST[31:0] ← SRC1[31:0] &lt;&lt; COUNT;
82 | FI;</pre>
83 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
84 | <p>Compiler auto generates KSHIFTLW when needed.</p>
85 | <h2>Flags Affected</h2>
86 | <p>None</p>
87 | <h2>SIMD Floating-Point Exceptions</h2>
88 | <p>None</p>
89 | <h2>Other Exceptions</h2>
90 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KSHIFTRW_KSHIFTRB_KSHIFTRQ_KSHIFTRD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KSHIFTRW/KSHIFTRB/KSHIFTRQ/KSHIFTRD—Shift Right Mask Registers </title></head>
 8 | <body>
 9 | <h1>KSHIFTRW/KSHIFTRB/KSHIFTRQ/KSHIFTRD—Shift Right Mask Registers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.L0.66.0F3A.W1 30 /r KSHIFTRW k1, k2, imm8</td>
19 | <td>RRI</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Shift right 16 bits in k2 by immediate and write result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L0.66.0F3A.W0 30 /r KSHIFTRB k1, k2, imm8</td>
25 | <td>RRI</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Shift right 8 bits in k2 by immediate and write result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L0.66.0F3A.W1 31 /r KSHIFTRQ k1, k2, imm8</td>
31 | <td>RRI</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Shift right 64 bits in k2 by immediate and write result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L0.66.0F3A.W0 31 /r KSHIFTRD k1, k2, imm8</td>
37 | <td>RRI</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Shift right 32 bits in k2 by immediate and write result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RRI</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td>
52 | <td>Imm8</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Shifts 8/16/32/64 bits in the second operand (source operand) right by the count specified in the immediate byte and places the least significant 8/16/32/64 bits of the result in the destination operand. The higher bits of the destination are zero-extended. The destination is set to zero if the count value is greater than 7 (for byte shift), 15 (for word shift), 31 (for doubleword shift) or 63 (for quadword shift).</p>
55 | <h2>Operation</h2>
56 | <p><strong>KSHIFTRW</strong></p>
57 | <pre>COUNT ← imm8[7:0]
58 | DEST[MAX_KL-1:0] ← 0
59 | IF COUNT &lt;=15
60 |     THEN DEST[15:0] ← SRC1[15:0] &gt;&gt; COUNT;
61 | FI;</pre>
62 | <p><strong>KSHIFTRB</strong></p>
63 | <pre>COUNT ← imm8[7:0]
64 | DEST[MAX_KL-1:0] ← 0
65 | IF COUNT &lt;=7
66 |           THEN
67 |                      DEST[7:0] ← SRC1[7:0] &gt;&gt; COUNT;
68 | FI;</pre>
69 | <p><strong>KSHIFTRQ</strong></p>
70 | <pre>COUNT ← imm8[7:0]
71 | DEST[MAX_KL-1:0] ← 0
72 | IF COUNT &lt;=63
73 |           THEN
74 |                      DEST[63:0] ← SRC1[63:0] &gt;&gt; COUNT;
75 | FI;</pre>
76 | <p><strong>KSHIFTRD</strong></p>
77 | <pre>COUNT ← imm8[7:0]
78 | DEST[MAX_KL-1:0] ← 0
79 | IF COUNT &lt;=31
80 |           THEN
81 |                      DEST[31:0] ← SRC1[31:0] &gt;&gt; COUNT;
82 | FI;</pre>
83 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
84 | <p>Compiler auto generates KSHIFTRW when needed.</p>
85 | <h2>Flags Affected</h2>
86 | <p>None</p>
87 | <h2>SIMD Floating-Point Exceptions</h2>
88 | <p>None</p>
89 | <h2>Other Exceptions</h2>
90 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KUNPCKBW_KUNPCKWD_KUNPCKDQ.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KUNPCKBW/KUNPCKWD/KUNPCKDQ—Unpack for Mask Registers </title></head>
 8 | <body>
 9 | <h1>KUNPCKBW/KUNPCKWD/KUNPCKDQ—Unpack for Mask Registers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.66.0F.W0 4B /r KUNPCKBW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Unpack and interleave 8 bits masks in k2 and k3 and write word result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.NDS.L1.0F.W0 4B /r KUNPCKWD k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512BW</td>
28 | <td>Unpack and interleave 16 bits in k2 and k3 and write double-word result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.NDS.L1.0F.W1 4B /r KUNPCKDQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Unpack and interleave 32 bits masks in k2 and k3 and write quadword result in k1.</td></tr></table>
35 | <h3>Instruction Operand Encoding</h3>
36 | <table>
37 | <tr>
38 | <td>Op/En</td>
39 | <td>Operand 1</td>
40 | <td>Operand 2</td>
41 | <td>Operand 3</td></tr>
42 | <tr>
43 | <td>RVR</td>
44 | <td>ModRM:reg (w)</td>
45 | <td>VEX.1vvv (r)</td>
46 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
47 | <h2>Description</h2>
48 | <p>Unpacks the lower 8/16/32 bits of the second and third operands (source operands) into the low part of the first operand (destination operand), starting from the low bytes. The result is zero-extended in the destination.</p>
49 | <h2>Operation</h2>
50 | <p><strong>KUNPCKBW</strong></p>
51 | <pre>DEST[7:0] ← SRC2[7:0]
52 | DEST[15:8] ← SRC1[7:0]
53 | DEST[MAX_KL-1:16] ← 0</pre>
54 | <p><strong>KUNPCKWD</strong></p>
55 | <pre>DEST[15:0] ← SRC2[15:0]
56 | DEST[31:16] ← SRC1[15:0]
57 | DEST[MAX_KL-1:32] ← 0</pre>
58 | <p><strong>KUNPCKDQ</strong></p>
59 | <pre>DEST[31:0] ← SRC2[31:0]
60 | DEST[63:32] ← SRC1[31:0]
61 | DEST[MAX_KL-1:64] ← 0</pre>
62 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
63 | <p>KUNPCKBW __mmask16 _mm512_kunpackb(__mmask16 a, __mmask16 b);</p>
64 | <p>KUNPCKDQ __mmask64 _mm512_kunpackd(__mmask64 a, __mmask64 b);</p>
65 | <p>KUNPCKWD __mmask32 _mm512_kunpackw(__mmask32 a, __mmask32 b);</p>
66 | <h2>Flags Affected</h2>
67 | <p>None</p>
68 | <h2>SIMD Floating-Point Exceptions</h2>
69 | <p>None</p>
70 | <h2>Other Exceptions</h2>
71 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KXNORW_KXNORB_KXNORQ_KXNORD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KXNORW/KXNORB/KXNORQ/KXNORD—Bitwise Logical XNOR Masks </title></head>
 8 | <body>
 9 | <h1>KXNORW/KXNORB/KXNORQ/KXNORD—Bitwise Logical XNOR Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.0F.W0 46 /r KXNORW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise XNOR 16 bits masks k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 46 /r KXNORB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise XNOR 8 bits masks k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 46 /r KXNORQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise XNOR 64 bits masks k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 46 /r KXNORD k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise XNOR 32 bits masks k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RVR</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>VEX.1vvv (r)</td>
52 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Performs a bitwise XNOR between the vector mask k2 and the vector mask k3, and writes the result into vector mask k1 (three-operand form).</p>
55 | <h2>Operation</h2>
56 | <p><strong>KXNORW</strong></p>
57 | <pre>DEST[15:0] ← NOT (SRC1[15:0] BITWISE XOR SRC2[15:0])
58 | DEST[MAX_KL-1:16] ← 0</pre>
59 | <p><strong>KXNORB</strong></p>
60 | <pre>DEST[7:0] ← NOT (SRC1[7:0] BITWISE XOR SRC2[7:0])
61 | DEST[MAX_KL-1:8] ← 0</pre>
62 | <p><strong>KXNORQ</strong></p>
63 | <pre>DEST[63:0] ← NOT (SRC1[63:0] BITWISE XOR SRC2[63:0])
64 | DEST[MAX_KL-1:64] ← 0</pre>
65 | <p><strong>KXNORD</strong></p>
66 | <pre>DEST[31:0] ← NOT (SRC1[31:0] BITWISE XOR SRC2[31:0])
67 | DEST[MAX_KL-1:32] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>KXNORW __mmask16 _mm512_kxnor(__mmask16 a, __mmask16 b);</p>
70 | <h2>Flags Affected</h2>
71 | <p>None</p>
72 | <h2>SIMD Floating-Point Exceptions</h2>
73 | <p>None</p>
74 | <h2>Other Exceptions</h2>
75 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/KXORW_KXORB_KXORQ_KXORD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>KXORW/KXORB/KXORQ/KXORD—Bitwise Logical XOR Masks </title></head>
 8 | <body>
 9 | <h1>KXORW/KXORB/KXORQ/KXORD—Bitwise Logical XOR Masks</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.L1.0F.W0 47 /r KXORW k1, k2, k3</td>
19 | <td>RVR</td>
20 | <td>V/V</td>
21 | <td>AVX512F</td>
22 | <td>Bitwise XOR 16 bits masks k2 and k3 and place result in k1.</td></tr>
23 | <tr>
24 | <td>VEX.L1.66.0F.W0 47 /r KXORB k1, k2, k3</td>
25 | <td>RVR</td>
26 | <td>V/V</td>
27 | <td>AVX512DQ</td>
28 | <td>Bitwise XOR 8 bits masks k2 and k3 and place result in k1.</td></tr>
29 | <tr>
30 | <td>VEX.L1.0F.W1 47 /r KXORQ k1, k2, k3</td>
31 | <td>RVR</td>
32 | <td>V/V</td>
33 | <td>AVX512BW</td>
34 | <td>Bitwise XOR 64 bits masks k2 and k3 and place result in k1.</td></tr>
35 | <tr>
36 | <td>VEX.L1.66.0F.W1 47 /r KXORD k1, k2, k3</td>
37 | <td>RVR</td>
38 | <td>V/V</td>
39 | <td>AVX512BW</td>
40 | <td>Bitwise XOR 32 bits masks k2 and k3 and place result in k1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td></tr>
48 | <tr>
49 | <td>RVR</td>
50 | <td>ModRM:reg (w)</td>
51 | <td>VEX.1vvv (r)</td>
52 | <td>ModRM:r/m (r, ModRM:[7:6] must be 11b)</td></tr></table>
53 | <h2>Description</h2>
54 | <p>Performs a bitwise XOR between the vector mask k2 and the vector mask k3, and writes the result into vector mask k1 (three-operand form).</p>
55 | <h2>Operation</h2>
56 | <p><strong>KXORW</strong></p>
57 | <pre>DEST[15:0] ← SRC1[15:0] BITWISE XOR SRC2[15:0]
58 | DEST[MAX_KL-1:16] ← 0</pre>
59 | <p><strong>KXORB</strong></p>
60 | <pre>DEST[7:0] ← SRC1[7:0] BITWISE XOR SRC2[7:0]
61 | DEST[MAX_KL-1:8] ← 0</pre>
62 | <p><strong>KXORQ</strong></p>
63 | <pre>DEST[63:0] ← SRC1[63:0] BITWISE XOR SRC2[63:0]
64 | DEST[MAX_KL-1:64] ← 0</pre>
65 | <p><strong>KXORD</strong></p>
66 | <pre>DEST[31:0] ← SRC1[31:0] BITWISE XOR SRC2[31:0]
67 | DEST[MAX_KL-1:32] ← 0</pre>
68 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
69 | <p>KXORW __mmask16 _mm512_kxor(__mmask16 a, __mmask16 b);</p>
70 | <h2>Flags Affected</h2>
71 | <p>None</p>
72 | <h2>SIMD Floating-Point Exceptions</h2>
73 | <p>None</p>
74 | <h2>Other Exceptions</h2>
75 | <p>See Exceptions Type K20.</p></body></html>


--------------------------------------------------------------------------------
/html/LAHF.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>LAHF—Load Status Flags into AH Register </title></head>
 8 | <body>
 9 | <h1>LAHF—Load Status Flags into AH Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>9F</td>
20 | <td>LAHF</td>
21 | <td>NP</td>
22 | <td>Invalid*</td>
23 | <td>Valid</td>
24 | <td>Load: AH ← EFLAGS(SF:ZF:0:AF:0:PF:1:CF).</td></tr></table>
25 | <p><strong>NOTES: *Valid in specific steppings. See Description section.</strong></p>
26 | <h3>Instruction Operand Encoding</h3>
27 | <table>
28 | <tr>
29 | <td>Op/En</td>
30 | <td>Operand 1</td>
31 | <td>Operand 2</td>
32 | <td>Operand 3</td>
33 | <td>Operand 4</td></tr>
34 | <tr>
35 | <td>NP</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td>
39 | <td>NA</td></tr></table>
40 | <h2>Description</h2>
41 | <p>This instruction executes as described above in compatibility mode and legacy mode. It is valid in 64-bit mode only if CPUID.80000001H:ECX.LAHF-SAHF[bit 0] = 1.</p>
42 | <h2>Operation</h2>
43 | <pre>IF 64-Bit Mode
44 |     THEN
45 |          IF CPUID.80000001H:ECX.LAHF-SAHF[bit 0] = 1;
46 |               THEN AH ← RFLAGS(SF:ZF:0:AF:0:PF:1:CF); ELSE #UD;
47 |          FI;
48 |     ELSE
49 |          AH ← EFLAGS(SF:ZF:0:AF:0:PF:1:CF);
50 | FI;</pre>
51 | <h2>Flags Affected</h2>
52 | <p>None. The state of the flags in the EFLAGS register is not affected.</p>
53 | <h2>Protected Mode Exceptions</h2>
54 | <table class="exception-table">
55 | <tr>
56 | <td>#UD</td>
57 | <td>If the LOCK prefix is used.</td></tr></table>
58 | <h2>Real-Address Mode Exceptions</h2>
59 | <p>Same exceptions as in protected mode.</p>
60 | <h2>Virtual-8086 Mode Exceptions</h2>
61 | <p>Same exceptions as in protected mode.</p>
62 | <h2>Compatibility Mode Exceptions</h2>
63 | <p>Same exceptions as in protected mode.</p>
64 | <h2>64-Bit Mode Exceptions</h2>
65 | <table class="exception-table">
66 | <tr>
67 | <td>#UD</td>
68 | <td>
69 | <p>If CPUID.80000001H:ECX.LAHF-SAHF[bit 0] = 0.</p>
70 | <p>If the LOCK prefix is used.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/LDDQU.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>LDDQU—Load Unaligned Integer 128 Bits </title></head>
 8 | <body>
 9 | <h1>LDDQU—Load Unaligned Integer 128 Bits</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>F2 0F F0 /<em>r</em></p>
20 | <p>LDDQU <em>xmm1</em>, <em>mem</em></p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SSE3</td>
24 | <td>Load unaligned data from <em>mem</em> and return double quadword in <em>xmm1</em>.</td></tr>
25 | <tr>
26 | <td>
27 | <p>VEX.128.F2.0F.WIG F0 /r</p>
28 | <p>VLDDQU xmm1, m128</p></td>
29 | <td>RM</td>
30 | <td>V/V</td>
31 | <td>AVX</td>
32 | <td>Load unaligned packed integer values from mem to xmm1.</td></tr>
33 | <tr>
34 | <td>
35 | <p>VEX.256.F2.0F.WIG F0 /r</p>
36 | <p>VLDDQU ymm1, m256</p></td>
37 | <td>RM</td>
38 | <td>V/V</td>
39 | <td>AVX</td>
40 | <td>Load unaligned packed integer values from mem to ymm1.</td></tr></table>
41 | <h3>Instruction Operand Encoding</h3>
42 | <table>
43 | <tr>
44 | <td>Op/En</td>
45 | <td>Operand 1</td>
46 | <td>Operand 2</td>
47 | <td>Operand 3</td>
48 | <td>Operand 4</td></tr>
49 | <tr>
50 | <td>RM</td>
51 | <td>ModRM:reg (w)</td>
52 | <td>ModRM:r/m (r)</td>
53 | <td>NA</td>
54 | <td>NA</td></tr></table>
55 | <h2>Description</h2>
56 | <p>The instruction is <em>functionally similar </em>to (V)MOVDQU ymm/xmm, m256/m128 for loading from memory. That is: 32/16 bytes of data starting at an address specified by the source memory operand (second operand) are fetched from memory and placed in a destination register (first operand). The source operand need not be aligned on a 32/16-byte boundary. Up to 64/32 bytes may be loaded from memory; this is implementation dependent.</p>
57 | <p>This instruction may improve performance relative to (V)MOVDQU if the source operand crosses a cache line boundary. In situations that require the data loaded by (V)LDDQU be modified and stored to the same location, use (V)MOVDQU or (V)MOVDQA instead of (V)LDDQU. To move a double quadword to or from memory locations that are known to be aligned on 16-byte boundaries, use the (V)MOVDQA instruction.</p>
58 | <h2>Implementation Notes</h2>
59 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
60 | <p>Note: In VEX-encoded versions, VEX.vvvv is reserved and must be 1111b otherwise instructions will #UD.</p>
61 | <h2>Operation</h2>
62 | <p><strong>LDDQU (128-bit Legacy SSE version)</strong></p>
63 | <pre>DEST[127:0] ← SRC[127:0]
64 | DEST[VLMAX-1:128] (Unmodified)</pre>
65 | <p><strong>VLDDQU (VEX.128 encoded version)</strong></p>
66 | <pre>DEST[127:0] ← SRC[127:0]
67 | DEST[VLMAX-1:128] ← 0</pre>
68 | <p><strong>VLDDQU (VEX.256 encoded version)</strong></p>
69 | <pre>DEST[255:0] ← SRC[255:0]</pre>
70 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
71 | <p>LDDQU:</p>
72 | <p>__m128i _mm_lddqu_si128 (__m128i * p);</p>
73 | <p>VLDDQU: __m256i _mm256_lddqu_si256 (__m256i * p);</p>
74 | <h2>Numeric Exceptions</h2>
75 | <p>None</p>
76 | <h2>Other Exceptions</h2>
77 | <p>See Exceptions Type 4;</p>
78 | <p>Note treatment of #AC varies.</p></body></html>


--------------------------------------------------------------------------------
/html/LDMXCSR.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>LDMXCSR—Load MXCSR Register </title></head>
 8 | <body>
 9 | <h1>LDMXCSR—Load MXCSR Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F AE /2</p>
20 | <p>LDMXCSR <em>m32</em></p></td>
21 | <td>M</td>
22 | <td>V/V</td>
23 | <td>SSE</td>
24 | <td>Load MXCSR register from <em>m32</em>.</td></tr>
25 | <tr>
26 | <td>
27 | <p>VEX.LZ.0F.WIG AE /2</p>
28 | <p>VLDMXCSR <em>m32</em></p></td>
29 | <td>M</td>
30 | <td>V/V</td>
31 | <td>AVX</td>
32 | <td>Load MXCSR register from <em>m32.</em></td></tr></table>
33 | <h3>Instruction Operand Encoding</h3>
34 | <table>
35 | <tr>
36 | <td>Op/En</td>
37 | <td>Operand 1</td>
38 | <td>Operand 2</td>
39 | <td>Operand 3</td>
40 | <td>Operand 4</td></tr>
41 | <tr>
42 | <td>M</td>
43 | <td>ModRM:r/m (r)</td>
44 | <td>NA</td>
45 | <td>NA</td>
46 | <td>NA</td></tr></table>
47 | <h2>Description</h2>
48 | <p>Loads the source operand into the MXCSR control/status register. The source operand is a 32-bit memory location. See “MXCSR Control and Status Register” in Chapter 10 of the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 1</em>, for a description of the MXCSR register and its contents.</p>
49 | <p>The LDMXCSR instruction is typically used in conjunction with the (V)STMXCSR instruction, which stores the contents of the MXCSR register in memory.</p>
50 | <p>The default MXCSR value at reset is 1F80H.</p>
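51 | <p>If a (V)LDMXCSR instruction clears a SIMD floating-point exception mask bit and sets the corresponding exception flag bit, a SIMD floating-point exception will not be immediately generated. The exception will be generated only upon the execution of the next instruction that meets both of the following conditions: (1) the instruction operates on an XMM or YMM register operand, and (2) the instruction causes that particular SIMD floating-point exception to be reported.</p>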
52 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
53 | <p>If VLDMXCSR is encoded with VEX.L= 1, an attempt to execute the instruction encoded with VEX.L= 1 will cause an #UD exception.</p>
54 | <p>Note: In VEX-encoded versions, VEX.vvvv is reserved and must be 1111b, otherwise instructions will #UD.</p>
55 | <h2>Operation</h2>
56 | <pre>MXCSR ← m32;</pre>
57 | <h2>C/C++ Compiler Intrinsic Equivalent</h2>
58 | <p>_mm_setcsr(unsigned int i)</p>
59 | <h2>Numeric Exceptions</h2>
60 | <p>None</p>
61 | <h2>Other Exceptions</h2>
62 | <p>See Exceptions Type 5; additionally</p>
63 | <table class="exception-table">
64 | <tr>
65 | <td>#GP</td>
66 | <td>For an attempt to set reserved bits in MXCSR.</td></tr>
67 | <tr>
68 | <td>#UD</td>
69 | <td>If VEX.vvvv ≠ 1111B.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/LFENCE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>LFENCE—Load Fence </title></head>
 8 | <body>
 9 | <h1>LFENCE—Load Fence</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F AE E8</td>
20 | <td>LFENCE</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Serializes load operations.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Performs a serializing operation on all load-from-memory instructions that were issued prior to the LFENCE instruction. Specifically, LFENCE does not execute until all prior instructions have completed locally, and no later instruction begins execution until LFENCE completes. In particular, an instruction that loads from memory and that precedes an LFENCE receives data from memory prior to completion of the LFENCE. (An LFENCE that follows an instruction that stores to memory might complete <strong>before</strong> the data being stored have become globally visible.) Instructions following an LFENCE may be fetched from memory before the LFENCE, but they will not execute until the LFENCE completes.</p>
41 | <p>Weakly ordered memory types can be used to achieve higher processor performance through such techniques as out-of-order issue and speculative reads. The degree to which a consumer of data recognizes or knows that the data is weakly ordered varies among applications and may be unknown to the producer of this data. The LFENCE instruction provides a performance-efficient way of ensuring load ordering between routines that produce weakly-ordered results and routines that consume that data.</p>
42 | <p>Processors are free to fetch and cache data speculatively from regions of system memory that use the WB, WC, and WT memory types. This speculative fetching can occur at any time and is not tied to instruction execution. Thus, it is not ordered with respect to executions of the LFENCE instruction; data can be brought into the caches speculatively just before, during, or after the execution of an LFENCE instruction.</p>
43 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
44 | <p>Specification of the instruction's opcode above indicates a ModR/M byte of E8. For this instruction, the processor ignores the r/m field of the ModR/M byte. Thus, LFENCE is encoded by any opcode of the form 0F AE Ex, where x is in the range 8-F.</p>
45 | <h2>Operation</h2>
46 | <pre>Wait_On_Following_Instructions_Until(preceding_instructions_complete);</pre>
47 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
48 | <p>void _mm_lfence(void)</p>
49 | <h2>Exceptions (All Modes of Operation)</h2>
50 | <p>#UD</p>
51 | <p>If CPUID.01H:EDX.SSE2[bit 26] = 0.</p>
52 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/MOVDQ2Q.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>MOVDQ2Q—Move Quadword from XMM to MMX Technology Register </title></head>
 8 | <body>
 9 | <h1>MOVDQ2Q—Move Quadword from XMM to MMX Technology Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F2 0F D6 /r</td>
20 | <td>MOVDQ2Q <em>mm</em>, <em>xmm</em></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Move low quadword from <em>xmm</em> to <em>mmx </em>register.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Moves the low quadword from the source operand (second operand) to the destination operand (first operand). The source operand is an XMM register and the destination operand is an MMX technology register.</p>
41 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the MOVDQ2Q instruction is executed.</p>
42 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
43 | <h2>Operation</h2>
44 | <pre>DEST ← SRC[63:0];</pre>
45 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
46 | <p>MOVDQ2Q:</p>
47 | <p>__m64 _mm_movepi64_pi64 ( __m128i a)</p>
48 | <h2>SIMD Floating-Point Exceptions</h2>
49 | <p>None.</p>
50 | <h2>Protected Mode Exceptions</h2>
51 | <table class="exception-table">
52 | <tr>
53 | <td>#NM</td>
54 | <td>If CR0.TS[bit 3] = 1.</td></tr>
55 | <tr>
56 | <td>#UD</td>
57 | <td>
58 | <p>If CR0.EM[bit 2] = 1.</p>
59 | <p>If CR4.OSFXSR[bit 9] = 0.</p>
60 | <p>If CPUID.01H:EDX.SSE2[bit 26] = 0.</p>
61 | <p>If the LOCK prefix is used.</p></td></tr>
62 | <tr>
63 | <td>#MF</td>
64 | <td>If there is a pending x87 FPU exception.</td></tr></table>
65 | <h2>Real-Address Mode Exceptions</h2>
66 | <p>Same exceptions as in protected mode.</p>
67 | <h2>Virtual-8086 Mode Exceptions</h2>
68 | <p>Same exceptions as in protected mode.</p>
69 | <h2>Compatibility Mode Exceptions</h2>
70 | <p>Same exceptions as in protected mode.</p>
71 | <h2>64-Bit Mode Exceptions</h2>
72 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/MOVNTQ.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>MOVNTQ—Store of Quadword Using Non-Temporal Hint </title></head>
 8 | <body>
 9 | <h1>MOVNTQ—Store of Quadword Using Non-Temporal Hint</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F E7 /<em>r</em></td>
20 | <td>MOVNTQ <em>m64</em>, <em>mm</em></td>
21 | <td>MR</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Move quadword from <em>mm</em> to <em>m64 </em>using non-temporal hint.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>MR</td>
35 | <td>ModRM:r/m (w)</td>
36 | <td>ModRM:reg (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Moves the quadword in the source operand (second operand) to the destination operand (first operand) using a non-temporal hint to minimize cache pollution during the write to memory. The source operand is an MMX technology register, which is assumed to contain packed integer data (packed bytes, words, or doublewords). The destination operand is a 64-bit memory location.</p>
41 | <p>The non-temporal hint is implemented by using a write combining (WC) memory type protocol when writing the data to memory. Using this protocol, the processor does not write the data into the cache hierarchy, nor does it fetch the corresponding cache line from memory into the cache hierarchy. The memory type of the region being written to can override the non-temporal hint, if the memory address specified for the non-temporal store is in an uncacheable (UC) or write protected (WP) memory region. For more information on non-temporal stores, see “Caching of Temporal vs. Non-Temporal Data” in Chapter 10 in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 1</em>.</p>
42 | <p>Because the WC protocol uses a weakly-ordered memory consistency model, a fencing operation implemented with the SFENCE or MFENCE instruction should be used in conjunction with MOVNTQ instructions if multiple processors might use different memory types to read/write the destination memory locations.</p>
43 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
44 | <h2>Operation</h2>
45 | <pre>DEST ← SRC;</pre>
46 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
47 | <p>MOVNTQ:</p>
48 | <p>void _mm_stream_pi(__m64 * p, __m64 a)</p>
49 | <h2>SIMD Floating-Point Exceptions</h2>
50 | <p>None.</p>
51 | <h2>Other Exceptions</h2>
52 | <p>See Table 22-8, “Exception Conditions for Legacy SIMD/MMX Instructions without FP Exception,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3A</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/MOVQ2DQ.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>MOVQ2DQ—Move Quadword from MMX Technology to XMM Register </title></head>
 8 | <body>
 9 | <h1>MOVQ2DQ—Move Quadword from MMX Technology to XMM Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F3 0F D6 /r</td>
20 | <td>MOVQ2DQ <em>xmm</em>, <em>mm</em></td>
21 | <td>RM</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Move quadword from <em>mmx</em> to low quadword of <em>xmm</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RM</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Moves the quadword from the source operand (second operand) to the low quadword of the destination operand (first operand). The source operand is an MMX technology register and the destination operand is an XMM register.</p>
41 | <p>This instruction causes a transition from x87 FPU to MMX technology operation (that is, the x87 FPU top-of-stack pointer is set to 0 and the x87 FPU tag word is set to all 0s [valid]). If this instruction is executed while an x87 FPU floating-point exception is pending, the exception is handled before the MOVQ2DQ instruction is executed.</p>
42 | <p>In 64-bit mode, use of the REX.R prefix permits this instruction to access additional registers (XMM8-XMM15).</p>
43 | <h2>Operation</h2>
44 | <pre>DEST[63:0] ← SRC[63:0];
45 | DEST[127:64] ← 00000000000000000H;</pre>
46 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
47 | <p>MOVQ2DQ:</p>
48 | <p>__m128i _mm_movpi64_epi64 ( __m64 a)</p>
49 | <h2>SIMD Floating-Point Exceptions</h2>
50 | <p>None.</p>
51 | <h2>Protected Mode Exceptions</h2>
52 | <table class="exception-table">
53 | <tr>
54 | <td>#NM</td>
55 | <td>If CR0.TS[bit 3] = 1.</td></tr>
56 | <tr>
57 | <td>#UD</td>
58 | <td>
59 | <p>If CR0.EM[bit 2] = 1.</p>
60 | <p>If CR4.OSFXSR[bit 9] = 0.</p>
61 | <p>If CPUID.01H:EDX.SSE2[bit 26] = 0.</p>
62 | <p>If the LOCK prefix is used.</p></td></tr>
63 | <tr>
64 | <td>#MF</td>
65 | <td>If there is a pending x87 FPU exception.</td></tr></table>
66 | <h2>Real-Address Mode Exceptions</h2>
67 | <p>Same exceptions as in protected mode.</p>
68 | <h2>Virtual-8086 Mode Exceptions</h2>
69 | <p>Same exceptions as in protected mode.</p>
70 | <h2>Compatibility Mode Exceptions</h2>
71 | <p>Same exceptions as in protected mode.</p>
72 | <h2>64-Bit Mode Exceptions</h2>
73 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/MULX.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>MULX — Unsigned Multiply Without Affecting Flags </title></head>
 8 | <body>
 9 | <h1>MULX — Unsigned Multiply Without Affecting Flags</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 -bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>VEX.NDD.LZ.F2.0F38.W0 F6 /r</p>
20 | <p>MULX <em>r32a, r32b, r/m32</em></p></td>
21 | <td>RVM</td>
22 | <td>V/V</td>
23 | <td>BMI2</td>
24 | <td>Unsigned multiply of <em>r/m32</em> with EDX without affecting arithmetic flags.</td></tr>
25 | <tr>
26 | <td>
27 | <p>VEX.NDD.LZ.F2.0F38.W1 F6 /r</p>
28 | <p>MULX <em>r64a, r64b, r/m64</em></p></td>
29 | <td>RVM</td>
30 | <td>V/N.E.</td>
31 | <td>BMI2</td>
32 | <td>Unsigned multiply of <em>r/m64</em> with RDX without affecting arithmetic flags.</td></tr></table>
33 | <h3>Instruction Operand Encoding</h3>
34 | <table>
35 | <tr>
36 | <td>
37 | <p>Op/En</p>
38 | <p>RVM</p></td>
39 | <td>
40 | <p>Operand 1</p>
41 | <p>ModRM:reg (w)</p></td>
42 | <td>
43 | <p>Operand 2</p>
44 | <p>VEX.vvvv (w)</p></td>
45 | <td>
46 | <p>Operand 3</p>
47 | <p>ModRM:r/m (r)</p></td>
48 | <td>
49 | <p>Operand 4</p>
50 | <p>RDX/EDX is implied 64/32 bits</p>
51 | <p>source</p></td></tr></table>
52 | <h2>Description</h2>
53 | <p>Performs an unsigned multiplication of the implicit source operand (EDX/RDX) and the specified source operand (the third operand) and stores the low half of the result in the second destination (second operand), the high half of the result in the first destination operand (first operand), without reading or writing the arithmetic flags. This enables efficient programming where the software can interleave add with carry operations and multiplications.</p>
54 | <p>If the first and second operands are identical, the register will contain the high half of the multiplication result.</p>
55 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
56 | <h2>Operation</h2>
57 | <pre>// DEST1: ModRM:reg
58 | // DEST2: VEX.vvvv
59 | IF (OperandSize = 32)
60 |     SRC1 ← EDX;
61 |     DEST2 ← (SRC1*SRC2)[31:0];
62 |     DEST1 ← (SRC1*SRC2)[63:32];
63 | ELSE IF (OperandSize = 64)
64 |     SRC1 ← RDX;
65 |          DEST2 ← (SRC1*SRC2)[63:0];
66 |          DEST1 ← (SRC1*SRC2)[127:64];
67 | FI</pre>
68 | <h2>Flags Affected</h2>
69 | <p>None</p>
70 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
71 | <p>Auto-generated from high-level language when possible.</p>
72 | <p>unsigned int mulx_u32(unsigned int a, unsigned int b, unsigned int * hi);</p>
73 | <p>unsigned __int64 mulx_u64(unsigned __int64 a, unsigned __int64 b, unsigned __int64 * hi);</p>
74 | <h2>SIMD Floating-Point Exceptions</h2>
75 | <p>None</p>
76 | <h2>Other Exceptions</h2>
77 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
78 | <table class="exception-table">
79 | <tr>
80 | <td>#UD</td>
81 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/PAUSE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>PAUSE—Spin Loop Hint </title></head>
 8 | <body>
 9 | <h1>PAUSE—Spin Loop Hint</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F3 90</td>
20 | <td>PAUSE</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Gives hint to processor that improves performance of spin-wait loops.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Improves the performance of spin-wait loops. When executing a “spin-wait loop,” processors will suffer a severe performance penalty when exiting the loop because it detects a possible memory order violation. The PAUSE instruction provides a hint to the processor that the code sequence is a spin-wait loop. The processor uses this hint to avoid the memory order violation in most situations, which greatly improves processor performance. For this reason, it is recommended that a PAUSE instruction be placed in all spin-wait loops.</p>
41 | <p>An additional function of the PAUSE instruction is to reduce the power consumed by a processor while executing a spin loop. A processor can execute a spin-wait loop extremely quickly, causing the processor to consume a lot of power while it waits for the resource it is spinning on to become available. Inserting a pause instruction in a spin-wait loop greatly reduces the processor’s power consumption.</p>
42 | <p>This instruction was introduced in the Pentium 4 processors, but is backward compatible with all IA-32 processors. In earlier IA-32 processors, the PAUSE instruction operates like a NOP instruction. The Pentium 4 and Intel Xeon processors implement the PAUSE instruction as a delay. The delay is finite and can be zero for some processors. This instruction does not change the architectural state of the processor (that is, it performs essentially a delaying no-op operation).</p>
43 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
44 | <h2>Operation</h2>
45 | <pre>Execute_Next_Instruction(DELAY);</pre>
46 | <h2>Numeric Exceptions</h2>
47 | <p>None.</p>
48 | <h2>Exceptions (All Operating Modes)</h2>
49 | <table class="exception-table">
50 | <tr>
51 | <td>#UD</td>
52 | <td>If the LOCK prefix is used.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/PSHUFW.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>PSHUFW—Shuffle Packed Words </title></head>
 8 | <body>
 9 | <h1>PSHUFW—Shuffle Packed Words</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64-Bit Mode</th>
15 | <th>Compat/Leg Mode</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 70 /<em>r</em> ib</p>
20 | <p>PSHUFW <em>mm1, mm2/m64, imm8</em></p></td>
21 | <td>RMI</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Shuffle the words in <em>mm2/m64</em> based on the encoding in <em>imm8</em> and store the result in <em>mm1</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RMI</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>ModRM:r/m (r)</td>
37 | <td>imm8</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Copies words from the source operand (second operand) and inserts them in the destination operand (first operand) at word locations selected with the order operand (third operand). This operation is similar to the operation used by the PSHUFD instruction, which is illustrated in Figure 4-16. For the PSHUFW instruction, each 2-bit field in the order operand selects the contents of one word location in the destination operand. The encodings of the order operand fields select words from the source operand to be copied to the destination operand.</p>
41 | <p>The source operand can be an MMX technology register or a 64-bit memory location. The destination operand is an MMX technology register. The order operand is an 8-bit immediate. Note that this instruction permits a word in the source operand to be copied to more than one word location in the destination operand.</p>
42 | <p>In 64-bit mode, using a REX prefix in the form of REX.R permits this instruction to access additional registers (XMM8-XMM15).</p>
43 | <h2>Operation</h2>
44 | <pre>DEST[15:0] ← (SRC &gt;&gt; (ORDER[1:0] * 16))[15:0];
45 | DEST[31:16] ← (SRC &gt;&gt; (ORDER[3:2] * 16))[15:0];
46 | DEST[47:32] ← (SRC &gt;&gt; (ORDER[5:4] * 16))[15:0];
47 | DEST[63:48] ← (SRC &gt;&gt; (ORDER[7:6] * 16))[15:0];</pre>
48 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
49 | <p>PSHUFW:</p>
50 | <p>__m64 _mm_shuffle_pi16(__m64 a, int n)</p>
51 | <h2>Flags Affected</h2>
52 | <p>None.</p>
53 | <h2>Numeric Exceptions</h2>
54 | <p>None.</p>
55 | <h2>Other Exceptions</h2>
56 | <p>See Table 22-7, “Exception Conditions for SIMD/MMX Instructions with Memory Reference,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3A</em>.</p></body></html>


--------------------------------------------------------------------------------
/html/RDPID.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>RDPID—Read Processor ID </title></head>
 8 | <body>
 9 | <h1>RDPID—Read Processor ID</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32-bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>F3 0F C7 /7 RDPID r32</td>
19 | <td>M</td>
20 | <td>N.E./V</td>
21 | <td>RDPID</td>
22 | <td>Read IA32_TSC_AUX into r32.</td></tr>
23 | <tr>
24 | <td>F3 0F C7 /7 RDPID r64</td>
25 | <td>M</td>
26 | <td>V/N.E.</td>
27 | <td>RDPID</td>
28 | <td>Read IA32_TSC_AUX into r64.</td></tr></table>
29 | <h3>Instruction Operand Encoding</h3>
30 | <table>
31 | <tr>
32 | <td>Op/En</td>
33 | <td>Operand 1</td>
34 | <td>Operand 2</td>
35 | <td>Operand 3</td>
36 | <td>Operand 4</td></tr>
37 | <tr>
38 | <td>M</td>
39 | <td>ModRM:r/m (w)</td>
40 | <td>NA</td>
41 | <td>NA</td>
42 | <td>NA</td></tr></table>
43 | <h2>Description</h2>
44 | <p>Reads the value of the IA32_TSC_AUX MSR (address C0000103H) into the destination register. The value of CS.D and operand-size prefixes (66H and REX.W) do not affect the behavior of the RDPID instruction.</p>
45 | <h2>Operation</h2>
46 | <pre>DEST ← IA32_TSC_AUX</pre>
47 | <h2>Flags Affected</h2>
48 | <p>None.</p>
49 | <h2>Protected Mode Exceptions</h2>
50 | <table class="exception-table">
51 | <tr>
52 | <td>#UD</td>
53 | <td>
54 | <p>If the LOCK prefix is used.</p>
55 | <p>If the F2 prefix is used.</p>
56 | <p>If CPUID.7H.0:ECX.RDPID[bit 22] = 0.</p></td></tr></table>
57 | <h2>Real-Address Mode Exceptions</h2>
58 | <p>Same exceptions as in protected mode.</p>
59 | <h2>Virtual-8086 Mode Exceptions</h2>
60 | <p>Same exceptions as in protected mode.</p>
61 | <h2>Compatibility Mode Exceptions</h2>
62 | <p>Same exceptions as in protected mode.</p>
63 | <h2>64-Bit Mode Exceptions</h2>
64 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/RDPKRU.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>RDPKRU—Read Protection Key Rights for User Pages </title></head>
 8 | <body>
 9 | <h1>RDPKRU—Read Protection Key Rights for User Pages</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64/32bit Mode Support</th>
16 | <th>CPUID Feature Flag</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 01 EE</td>
20 | <td>RDPKRU</td>
21 | <td>NP</td>
22 | <td>V/V</td>
23 | <td>OSPKE</td>
24 | <td>Reads PKRU into EAX.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Reads the value of PKRU into EAX and clears EDX. ECX must be 0 when RDPKRU is executed; otherwise, a general-protection exception (#GP) occurs.</p>
41 | <p>RDPKRU can be executed only if CR4.PKE = 1; otherwise, an invalid-opcode exception (#UD) occurs. Software can discover the value of CR4.PKE by examining CPUID.(EAX=07H,ECX=0H):ECX.OSPKE [bit 4].</p>
42 | <p>On processors that support the Intel 64 Architecture, the high-order 32-bits of RCX are ignored and the high-order 32-bits of RDX and RAX are cleared.</p>
43 | <h2>Operation</h2>
44 | <pre>IF (ECX = 0)
45 |     THEN
46 |          EAX ← PKRU;
47 |          EDX ← 0;
48 |     ELSE #GP(0);
49 | FI;</pre>
50 | <h2>Flags Affected</h2>
51 | <p>None.</p>
52 | <h2>C/C++ Compiler Intrinsic Equivalent</h2>
53 | <p>RDPKRU:</p>
54 | <p>uint32_t _rdpkru_u32(void);</p>
55 | <h2>Protected Mode Exceptions</h2>
56 | <table class="exception-table">
57 | <tr>
58 | <td>#GP(0)</td>
59 | <td>If ECX ≠ 0</td></tr>
60 | <tr>
61 | <td>#UD</td>
62 | <td>
63 | <p>If the LOCK prefix is used.</p>
64 | <p>If CR4.PKE = 0.</p></td></tr></table>
65 | <h2>Real-Address Mode Exceptions</h2>
66 | <p>Same exceptions as in protected mode.</p>
67 | <h2>Virtual-8086 Mode Exceptions</h2>
68 | <p>Same exceptions as in protected mode.</p>
69 | <h2>Compatibility Mode Exceptions</h2>
70 | <p>Same exceptions as in protected mode.</p>
71 | <h2>64-Bit Mode Exceptions</h2>
72 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/RORX.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>RORX — Rotate Right Logical Without Affecting Flags </title></head>
 8 | <body>
 9 | <h1>RORX — Rotate Right Logical Without Affecting Flags</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 -bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>VEX.LZ.F2.0F3A.W0 F0 /r ib</p>
20 | <p>RORX r32, <em>r/m32, imm8</em></p></td>
21 | <td>RMI</td>
22 | <td>V/V</td>
23 | <td>BMI2</td>
24 | <td>Rotate 32-bit <em>r/m32</em> right <em>imm8</em> times without affecting arithmetic flags.</td></tr>
25 | <tr>
26 | <td>
27 | <p>VEX.LZ.F2.0F3A.W1 F0 /r ib</p>
28 | <p>RORX r64, <em>r/m64, imm8</em></p></td>
29 | <td>RMI</td>
30 | <td>V/N.E.</td>
31 | <td>BMI2</td>
32 | <td>Rotate 64-bit <em>r/m64</em> right <em>imm8</em> times without affecting arithmetic flags.</td></tr></table>
33 | <h3>Instruction Operand Encoding</h3>
34 | <table>
35 | <tr>
36 | <td>Op/En</td>
37 | <td>Operand 1</td>
38 | <td>Operand 2</td>
39 | <td>Operand 3</td>
40 | <td>Operand 4</td></tr>
41 | <tr>
42 | <td>RMI</td>
43 | <td>ModRM:reg (w)</td>
44 | <td>ModRM:r/m (r)</td>
45 | <td>Imm8</td>
46 | <td>NA</td></tr></table>
47 | <h2>Description</h2>
48 | <p>Rotates the bits of second operand right by the count value specified in imm8 without affecting arithmetic flags. The RORX instruction does not read or write the arithmetic flags.</p>
49 | <p>This instruction is not supported in real mode and virtual-8086 mode. The operand size is always 32 bits if not in 64-bit mode. In 64-bit mode operand size 64 requires VEX.W1. VEX.W1 is ignored in non-64-bit modes. An attempt to execute this instruction with VEX.L not equal to 0 will cause #UD.</p>
50 | <h2>Operation</h2>
51 | <pre>IF (OperandSize = 32)
52 |     y ← imm8 AND 1FH;
53 |     DEST ← (SRC &gt;&gt; y) | (SRC &lt;&lt; (32-y));
54 | ELSEIF (OperandSize = 64 )
55 |     y ← imm8 AND 3FH;
56 |     DEST ← (SRC &gt;&gt; y) | (SRC &lt;&lt; (64-y));
57 | ENDIF</pre>
58 | <h2>Flags Affected</h2>
59 | <p>None</p>
60 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
61 | <p>Auto-generated from high-level language.</p>
62 | <h2>SIMD Floating-Point Exceptions</h2>
63 | <p>None</p>
64 | <h2>Other Exceptions</h2>
65 | <p>See Section 2.5.1, “Exception Conditions for VEX-Encoded GPR Instructions”, Table 2-29; additionally</p>
66 | <table class="exception-table">
67 | <tr>
68 | <td>#UD</td>
69 | <td>If VEX.W = 1.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/RSM.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>RSM—Resume from System Management Mode </title></head>
 8 | <body>
 9 | <h1>RSM—Resume from System Management Mode</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F AA</td>
20 | <td>RSM</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Resume operation of interrupted program.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
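40 | <p>Returns program control from system management mode (SMM) to the application program or operating-system procedure that was interrupted when the processor received an SMM interrupt. The processor’s state is restored from the dump created upon entering SMM. If the processor detects invalid state information during state restoration, it enters the shutdown state. The following invalid information can cause a shutdown:</p><ul><li>Any reserved bit of CR4 is set to 1.</li><li>Any illegal combination of bits in CR0, such as (PG=1 and PE=0) or (NW=1 and CD=0).</li><li>(Intel Pentium and Intel486™ processors only.) The value stored in the state dump base field is not a 32-KByte aligned address.</li></ul>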
41 | <p>The contents of the model-specific registers are not affected by a return from SMM.</p>
42 | <p>The SMM state map used by RSM supports resuming processor context for non-64-bit modes and 64-bit mode.</p>
43 | <p>See Chapter 34, “System Management Mode,” in the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 3C</em>, for more information about SMM and the behavior of the RSM instruction.</p>
44 | <h2>Operation</h2>
45 | <pre>ReturnFromSMM;
46 | IF (IA-32e mode supported) or (CPUID DisplayFamily_DisplayModel = 06H_0CH )
47 |     THEN
48 |          ProcessorState ← Restore(SMMDump(IA-32e SMM STATE MAP));
49 |     Else
50 |          ProcessorState ← Restore(SMMDump(Non-32-Bit-Mode SMM STATE MAP));
51 | FI</pre>
52 | <h2>Flags Affected</h2>
53 | <p>All.</p>
54 | <h2>Protected Mode Exceptions</h2>
55 | <table class="exception-table">
56 | <tr>
57 | <td>#UD</td>
58 | <td>
59 | <p>If an attempt is made to execute this instruction when the processor is not in SMM.</p>
60 | <p>If the LOCK prefix is used.</p></td></tr></table>
61 | <h2>Real-Address Mode Exceptions</h2>
62 | <p>Same exceptions as in protected mode.</p>
63 | <h2>Virtual-8086 Mode Exceptions</h2>
64 | <p>Same exceptions as in protected mode.</p>
65 | <h2>Compatibility Mode Exceptions</h2>
66 | <p>Same exceptions as in protected mode.</p>
67 | <h2>64-Bit Mode Exceptions</h2>
68 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/SAHF.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SAHF—Store AH into Flags </title></head>
 8 | <body>
 9 | <h1>SAHF—Store AH into Flags</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>9E</td>
20 | <td>SAHF</td>
21 | <td>NP</td>
22 | <td>Invalid*</td>
23 | <td>Valid</td>
24 | <td>Loads SF, ZF, AF, PF, and CF from AH into EFLAGS register.</td></tr></table>
25 | <p><strong>NOTES: * Valid in specific steppings. See Description section.</strong></p>
26 | <h3>Instruction Operand Encoding</h3>
27 | <table>
28 | <tr>
29 | <td>Op/En</td>
30 | <td>Operand 1</td>
31 | <td>Operand 2</td>
32 | <td>Operand 3</td>
33 | <td>Operand 4</td></tr>
34 | <tr>
35 | <td>NP</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td>
39 | <td>NA</td></tr></table>
40 | <h2>Description</h2>
41 | <p>Loads the SF, ZF, AF, PF, and CF flags of the EFLAGS register with values from the corresponding bits in the AH register (bits 7, 6, 4, 2, and 0, respectively). Bits 1, 3, and 5 of register AH are ignored; the corresponding reserved bits (1, 3, and 5) in the EFLAGS register remain as shown in the “Operation” section below.</p>
42 | <p>This instruction executes as described above in compatibility mode and legacy mode. It is valid in 64-bit mode only if CPUID.80000001H:ECX.LAHF-SAHF[bit 0] = 1.</p>
43 | <h2>Operation</h2>
44 | <pre>IF 64-Bit Mode
45 |     THEN
46 |          IF CPUID.80000001H.ECX[0] = 1;
47 |               THEN
48 |                     RFLAGS(SF:ZF:0:AF:0:PF:1:CF) ← AH;
49 |               ELSE
50 |                     #UD;
51 |          FI
52 |     ELSE
53 |          EFLAGS(SF:ZF:0:AF:0:PF:1:CF) ← AH;
54 | FI;</pre>
55 | <h2>Flags Affected</h2>
56 | <p>The SF, ZF, AF, PF, and CF flags are loaded with values from the AH register. Bits 1, 3, and 5 of the EFLAGS register are unaffected, with the values remaining 1, 0, and 0, respectively.</p>
57 | <h2>Protected Mode Exceptions</h2>
58 | <p>None.</p>
59 | <h2>Real-Address Mode Exceptions</h2>
60 | <p>None.</p>
61 | <h2>Virtual-8086 Mode Exceptions</h2>
62 | <p>None.</p>
63 | <h2>Compatibility Mode Exceptions</h2>
64 | <p>None.</p>
65 | <h2>64-Bit Mode Exceptions</h2>
66 | <table class="exception-table">
67 | <tr>
68 | <td>#UD</td>
69 | <td>
70 | <p>If CPUID.80000001H.ECX[0] = 0.</p>
71 | <p>If the LOCK prefix is used.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/SFENCE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SFENCE—Store Fence </title></head>
 8 | <body>
 9 | <h1>SFENCE—Store Fence</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F AE F8</td>
20 | <td>SFENCE</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Serializes store operations.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Performs a serializing operation on all store-to-memory instructions that were issued prior to the SFENCE instruction. This serializing operation guarantees that every store instruction that precedes the SFENCE instruction in program order becomes globally visible before any store instruction that follows the SFENCE instruction. The SFENCE instruction is ordered with respect to store instructions, other SFENCE instructions, any LFENCE and MFENCE instructions, and any serializing instructions (such as the CPUID instruction). It is not ordered with respect to load instructions.</p>
41 | <p>Weakly ordered memory types can be used to achieve higher processor performance through such techniques as out-of-order issue, write-combining, and write-collapsing. The degree to which a consumer of data recognizes or knows that the data is weakly ordered varies among applications and may be unknown to the producer of this data. The SFENCE instruction provides a performance-efficient way of ensuring store ordering between routines that produce weakly-ordered results and routines that consume this data.</p>
42 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
43 | <p>Specification of the instruction's opcode above indicates a ModR/M byte of F8. For this instruction, the processor ignores the r/m field of the ModR/M byte. Thus, SFENCE is encoded by any opcode of the form 0F AE Fx, where x is in the range 8-F.</p>
44 | <h2>Operation</h2>
45 | <pre>Wait_On_Following_Stores_Until(preceding_stores_globally_visible);</pre>
46 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
47 | <p>void _mm_sfence(void)</p>
48 | <h2>Exceptions (All Operating Modes)</h2>
49 | <p>#UD</p>
50 | <p>If CPUID.01H:EDX.SSE[bit 25] = 0.</p>
51 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA1MSG1.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA1MSG1—Perform an Intermediate Calculation for the Next Four SHA1 Message Dwords </title></head>
 8 | <body>
 9 | <h1>SHA1MSG1—Perform an Intermediate Calculation for the Next Four SHA1 Message Dwords</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 C9 /r</p>
20 | <p>SHA1MSG1 xmm1, xmm2/m128</p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Performs an intermediate calculation for the next four SHA1 message dwords using previous message dwords from xmm1 and xmm2/m128, storing the result in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RM</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>NA</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA1MSG1 instruction is one of two SHA1 message scheduling instructions. The instruction performs an intermediate calculation for the next four SHA1 message dwords.</p>
39 | <p><strong>Operation</strong></p>
40 | <p><strong>SHA1MSG1</strong></p>
41 | <p>W0 ← SRC1[127:96] ;</p>
42 | <p>W1 ← SRC1[95:64] ;</p>
43 | <p>W2 ← SRC1[63: 32] ;</p>
44 | <p>W3 ← SRC1[31: 0] ;</p>
45 | <p>W4 ← SRC2[127:96] ;</p>
46 | <p>W5 ← SRC2[95:64] ;</p>
47 | <p>DEST[127:96] ← W2 XOR W0;</p>
48 | <p>DEST[95:64] ← W3 XOR W1;</p>
49 | <p>DEST[63:32] ← W4 XOR W2;</p>
50 | <p>DEST[31:0] ← W5 XOR W3;</p>
51 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
52 | <p>SHA1MSG1: __m128i _mm_sha1msg1_epu32(__m128i, __m128i);</p>
53 | <p><strong>Flags Affected</strong></p>
54 | <p>None</p>
55 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
56 | <p>None</p>
57 | <p><strong>Other Exceptions</strong></p>
58 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA1MSG2.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA1MSG2—Perform a Final Calculation for the Next Four SHA1 Message Dwords </title></head>
 8 | <body>
 9 | <h1>SHA1MSG2—Perform a Final Calculation for the Next Four SHA1 Message Dwords</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 CA /r</p>
20 | <p>SHA1MSG2 xmm1, xmm2/m128</p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Performs the final calculation for the next four SHA1 message dwords using intermediate results from xmm1 and the previous message dwords from xmm2/m128, storing the result in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RM</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>NA</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA1MSG2 instruction is one of two SHA1 message scheduling instructions. The instruction performs the final calculation to derive the next four SHA1 message dwords.</p>
39 | <p><strong>Operation</strong></p>
40 | <p><strong>SHA1MSG2</strong></p>
41 | <p>W13 ← SRC2[95:64] ;</p>
42 | <p>W14 ← SRC2[63: 32] ;</p>
43 | <p>W15 ← SRC2[31: 0] ;</p>
44 | <p>W16 ← (SRC1[127:96] XOR W13 ) ROL 1;</p>
45 | <p>W17 ← (SRC1[95:64] XOR W14) ROL 1;</p>
46 | <p>W18 ← (SRC1[63: 32] XOR W15) ROL 1;</p>
47 | <p>W19 ← (SRC1[31: 0] XOR W16) ROL 1;</p>
48 | <p>DEST[127:96] ← W16;</p>
49 | <p>DEST[95:64] ← W17;</p>
50 | <p>DEST[63:32] ← W18;</p>
51 | <p>DEST[31:0] ← W19;</p>
52 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
53 | <p>SHA1MSG2: __m128i _mm_sha1msg2_epu32(__m128i, __m128i);</p>
54 | <p><strong>Flags Affected</strong></p>
55 | <p>None</p>
56 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
57 | <p>None</p>
58 | <p><strong>Other Exceptions</strong></p>
59 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA1NEXTE.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA1NEXTE—Calculate SHA1 State Variable E after Four Rounds </title></head>
 8 | <body>
 9 | <h1>SHA1NEXTE—Calculate SHA1 State Variable E after Four Rounds</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 C8 /r</p>
20 | <p>SHA1NEXTE xmm1, xmm2/m128</p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Calculates SHA1 state variable E after four rounds of operation from the current SHA1 state variable A in xmm1. The calculated value of the SHA1 state variable E is added to the scheduled dwords in xmm2/m128, and stored with some of the scheduled dwords in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RM</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>NA</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA1NEXTE calculates the SHA1 state variable E after four rounds of operation from the current SHA1 state variable A in the destination operand. The calculated value of the SHA1 state variable E is added to the source operand, which contains the scheduled dwords.</p>
39 | <p><strong>Operation</strong></p>
40 | <p><strong>SHA1NEXTE</strong></p>
41 | <p>TMP ← (SRC1[127:96] ROL 30);</p>
42 | <p>DEST[127:96] ← SRC2[127:96] + TMP;</p>
43 | <p>DEST[95:64] ← SRC2[95:64];</p>
44 | <p>DEST[63:32] ← SRC2[63:32];</p>
45 | <p>DEST[31:0] ← SRC2[31:0];</p>
46 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
47 | <p>SHA1NEXTE: __m128i _mm_sha1nexte_epu32(__m128i, __m128i);</p>
48 | <p><strong>Flags Affected</strong></p>
49 | <p>None</p>
50 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
51 | <p>None</p>
52 | <p><strong>Other Exceptions</strong></p>
53 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA256MSG1.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA256MSG1—Perform an Intermediate Calculation for the Next Four SHA256 Message Dwords </title></head>
 8 | <body>
 9 | <h1>SHA256MSG1—Perform an Intermediate Calculation for the Next Four SHA256 Message Dwords</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 CC /r</p>
20 | <p>SHA256MSG1 xmm1, xmm2/m128</p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Performs an intermediate calculation for the next four SHA256 message dwords using previous message dwords from xmm1 and xmm2/m128, storing the result in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RM</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>NA</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA256MSG1 instruction is one of two SHA256 message scheduling instructions. The instruction performs an intermediate calculation for the next four SHA256 message dwords.</p>
39 | <p><strong>Operation</strong></p>
40 | <p><strong>SHA256MSG1</strong></p>
41 | <p>W4 ← SRC2[31: 0] ;</p>
42 | <p>W3 ← SRC1[127:96] ;</p>
43 | <p>W2 ← SRC1[95:64] ;</p>
44 | <p>W1 ← SRC1[63: 32] ;</p>
45 | <p>W0 ← SRC1[31: 0] ;</p>
46 | <p>DEST[127:96] ← W3 + σ<sub>0</sub>( W4);</p>
47 | <p>DEST[95:64] ← W2 + σ<sub>0</sub>( W3);</p>
48 | <p>DEST[63:32] ← W1 + σ<sub>0</sub>( W2);</p>
49 | <p>DEST[31:0] ← W0 + σ<sub>0</sub>( W1);</p>
50 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
51 | <p>SHA256MSG1: __m128i _mm_sha256msg1_epu32(__m128i, __m128i);</p>
52 | <p><strong>Flags Affected</strong></p>
53 | <p>None</p>
54 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
55 | <p>None</p>
56 | <p><strong>Other Exceptions</strong></p>
57 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA256MSG2.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA256MSG2—Perform a Final Calculation for the Next Four SHA256 Message Dwords </title></head>
 8 | <body>
 9 | <h1>SHA256MSG2—Perform a Final Calculation for the Next Four SHA256 Message Dwords</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 CD /r</p>
20 | <p>SHA256MSG2 xmm1, xmm2/m128</p></td>
21 | <td>RM</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Performs the final calculation for the next four SHA256 message dwords using previous message dwords from xmm1 and xmm2/m128, storing the result in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RM</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>NA</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA256MSG2 instruction is one of two SHA2 message scheduling instructions. The instruction performs the final calculation for the next four SHA256 message dwords.</p>
39 | <p><strong>Operation</strong></p>
40 | <p><strong>SHA256MSG2</strong></p>
41 | <p>W14 ← SRC2[95:64] ;</p>
42 | <p>W15 ← SRC2[127:96] ;</p>
43 | <p>W16 ← SRC1[31: 0] + σ<sub>1</sub>( W14) ;</p>
44 | <p>W17 ← SRC1[63: 32] + σ<sub>1</sub>( W15) ;</p>
45 | <p>W18 ← SRC1[95: 64] + σ<sub>1</sub>( W16) ;</p>
46 | <p>W19 ← SRC1[127: 96] + σ<sub>1</sub>( W17) ;</p>
47 | <p>DEST[127:96] ← W19 ;</p>
48 | <p>DEST[95:64] ← W18 ;</p>
49 | <p>DEST[63:32] ← W17 ;</p>
50 | <p>DEST[31:0] ← W16;</p>
51 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
52 | <p>SHA256MSG2 : __m128i _mm_sha256msg2_epu32(__m128i, __m128i);</p>
53 | <p><strong>Flags Affected</strong></p>
54 | <p>None</p>
55 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
56 | <p>None</p>
57 | <p><strong>Other Exceptions</strong></p>
58 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/SHA256RNDS2.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>SHA256RNDS2—Perform Two Rounds of SHA256 Operation </title></head>
 8 | <body>
 9 | <h1>SHA256RNDS2—Perform Two Rounds of SHA256 Operation</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 38 CB /r</p>
20 | <p>SHA256RNDS2 xmm1, xmm2/m128, &lt;XMM0&gt;</p></td>
21 | <td>RMI</td>
22 | <td>V/V</td>
23 | <td>SHA</td>
24 | <td>Perform 2 rounds of SHA256 operation using an initial SHA256 state (C,D,G,H) from xmm1, an initial SHA256 state (A,B,E,F) from xmm2/m128, and a pre-computed sum of the next 2 round message dwords and the corresponding round constants from the implicit operand XMM0, storing the updated SHA256 state (A,B,E,F) result in xmm1.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td></tr>
32 | <tr>
33 | <td>RMI</td>
34 | <td>ModRM:reg (r, w)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>Implicit XMM0 (r)</td></tr></table>
37 | <p><strong>Description</strong></p>
38 | <p>The SHA256RNDS2 instruction performs 2 rounds of SHA256 operation using an initial SHA256 state (C,D,G,H) from the first operand, an initial SHA256 state (A,B,E,F) from the second operand, and a pre-computed sum of the next 2 round message dwords and the corresponding round constants from the implicit operand xmm0. Note that only the two lower dwords of XMM0 are used by the instruction.</p>
39 | <p>The updated SHA256 state (A,B,E,F) is written to the first operand, and the second operand can be used as the updated state (C,D,G,H) in later rounds.</p>
40 | <p><strong>Operation</strong></p>
41 | <p><strong>SHA256RNDS2</strong></p>
42 | <p>A_0 ← SRC2[127:96];</p>
43 | <p>B_0 ← SRC2[95:64];</p>
44 | <p>C_0 ← SRC1[127:96];</p>
45 | <p>D_0 ← SRC1[95:64];</p>
46 | <p>E_0 ← SRC2[63:32];</p>
47 | <p>F_0 ← SRC2[31:0];</p>
48 | <p>G_0 ← SRC1[63:32];</p>
49 | <p>H_0 ← SRC1[31:0];</p>
50 | <p>WK<sub>0</sub> ← XMM0[31: 0];</p>
51 | <p>WK<sub>1</sub> ← XMM0[63: 32];</p>
52 | <p>FOR i = 0 to 1</p>
53 | <p>A_(i +1) ← Ch (E_i, F_i, G_i) +Σ<sub>1</sub>( E_i) +WK<sub>i</sub>+ H_i + Maj(A_i , B_i, C_i) +Σ<sub>0</sub>( A_i);</p>
54 | <p>B_(i +1) ← A_i;</p>
55 | <p>C_(i +1) ← B_i ;</p>
56 | <p>D_(i +1) ← C_i;</p>
57 | <p>E_(i +1) ← Ch (E_i, F_i, G_i) +Σ<sub>1</sub>( E_i) +WK<sub>i</sub>+ H_i + D_i;</p>
58 | <p>F_(i +1) ← E_i ;</p>
59 | <p>G_(i +1) ← F_i;</p>
60 | <p>H_(i +1) ← G_i;</p>
61 | <p>ENDFOR</p>
62 | <p>DEST[127:96] ← A_2;</p>
63 | <p>DEST[95:64] ← B_2;</p>
64 | <p>DEST[63:32] ← E_2;</p>
65 | <p>DEST[31:0] ← F_2;</p>
66 | <p><strong>Intel C/C++ Compiler Intrinsic Equivalent</strong></p>
67 | <p>SHA256RNDS2: __m128i _mm_sha256rnds2_epu32(__m128i, __m128i, __m128i);</p>
68 | <p><strong>Flags Affected</strong></p>
69 | <p>None</p>
70 | <p><strong>SIMD Floating-Point Exceptions</strong></p>
71 | <p>None</p>
72 | <p><strong>Other Exceptions</strong></p>
73 | <p>See Exceptions Type 4.</p></body></html>


--------------------------------------------------------------------------------
/html/STAC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>STAC—Set AC Flag in EFLAGS Register </title></head>
 8 | <body>
 9 | <h1>STAC—Set AC Flag in EFLAGS Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 01 CB</td>
20 | <td>STAC</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Set the AC flag in the EFLAGS register.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Sets the AC flag bit in EFLAGS register. This may enable alignment checking of user-mode data accesses. This allows explicit supervisor-mode data accesses to user-mode pages even if the SMAP bit is set in the CR4 register.</p>
41 | <p>This instruction's operation is the same in non-64-bit modes and 64-bit mode. Attempts to execute STAC when CPL &gt; 0 cause #UD.</p>
42 | <h2>Operation</h2>
43 | <pre>EFLAGS.AC ← 1;</pre>
44 | <h2>Flags Affected</h2>
45 | <p>AC set. Other flags are unaffected.</p>
46 | <h2>Protected Mode Exceptions</h2>
47 | <table class="exception-table">
48 | <tr>
49 | <td>#UD</td>
50 | <td>
51 | <p>If the LOCK prefix is used.</p>
52 | <p>If the CPL &gt; 0.</p>
53 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
54 | <h2>Real-Address Mode Exceptions</h2>
55 | <table class="exception-table">
56 | <tr>
57 | <td>#UD</td>
58 | <td>
59 | <p>If the LOCK prefix is used.</p>
60 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
61 | <h2>Virtual-8086 Mode Exceptions</h2>
62 | <table class="exception-table">
63 | <tr>
64 | <td>#UD</td>
65 | <td>The STAC instruction is not recognized in virtual-8086 mode.</td></tr></table>
66 | <h2>Compatibility Mode Exceptions</h2>
67 | <table class="exception-table">
68 | <tr>
69 | <td>#UD</td>
70 | <td>
71 | <p>If the LOCK prefix is used.</p>
72 | <p>If the CPL &gt; 0.</p>
73 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table>
74 | <h2>64-Bit Mode Exceptions</h2>
75 | <table class="exception-table">
76 | <tr>
77 | <td>#UD</td>
78 | <td>
79 | <p>If the LOCK prefix is used.</p>
80 | <p>If the CPL &gt; 0.</p>
81 | <p>If CPUID.(EAX=07H, ECX=0H):EBX.SMAP[bit 20] = 0.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/STC.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>STC—Set Carry Flag </title></head>
 8 | <body>
 9 | <h1>STC—Set Carry Flag</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>F9</td>
20 | <td>STC</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Set CF flag.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Sets the CF flag in the EFLAGS register. Operation is the same in all modes.</p>
41 | <h2>Operation</h2>
42 | <pre>CF ← 1;</pre>
43 | <h2>Flags Affected</h2>
44 | <p>The CF flag is set. The OF, ZF, SF, AF, and PF flags are unaffected.</p>
45 | <h2>Exceptions (All Operating Modes)</h2>
46 | <p>#UD</p>
47 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/STD.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>STD—Set Direction Flag </title></head>
 8 | <body>
 9 | <h1>STD—Set Direction Flag</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>FD</td>
20 | <td>STD</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Set DF flag.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Sets the DF flag in the EFLAGS register. When the DF flag is set to 1, string operations decrement the index registers (ESI and/or EDI). Operation is the same in all modes.</p>
41 | <h2>Operation</h2>
42 | <pre>DF ← 1;</pre>
43 | <h2>Flags Affected</h2>
44 | <p>The DF flag is set. The CF, OF, ZF, SF, AF, and PF flags are unaffected.</p>
45 | <h2>Exceptions (All Operating Modes)</h2>
46 | <p>#UD</p>
47 | <p>If the LOCK prefix is used.</p></body></html>


--------------------------------------------------------------------------------
/html/STMXCSR.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>STMXCSR—Store MXCSR Register State </title></head>
 8 | <body>
 9 | <h1>STMXCSR—Store MXCSR Register State</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F AE /3</p>
20 | <p>STMXCSR <em>m32</em></p></td>
21 | <td>M</td>
22 | <td>V/V</td>
23 | <td>SSE</td>
24 | <td>Store contents of MXCSR register to <em>m32</em>.</td></tr>
25 | <tr>
26 | <td>
27 | <p>VEX.LZ.0F.WIG AE /3</p>
28 | <p>VSTMXCSR <em>m32</em></p></td>
29 | <td>M</td>
30 | <td>V/V</td>
31 | <td>AVX</td>
32 | <td>Store contents of MXCSR register to <em>m32</em>.</td></tr></table>
33 | <h3>Instruction Operand Encoding</h3>
34 | <table>
35 | <tr>
36 | <td>Op/En</td>
37 | <td>Operand 1</td>
38 | <td>Operand 2</td>
39 | <td>Operand 3</td>
40 | <td>Operand 4</td></tr>
41 | <tr>
42 | <td>M</td>
43 | <td>ModRM:r/m (w)</td>
44 | <td>NA</td>
45 | <td>NA</td>
46 | <td>NA</td></tr></table>
47 | <h2>Description</h2>
48 | <p>Stores the contents of the MXCSR control and status register to the destination operand. The destination operand is a 32-bit memory location. The reserved bits in the MXCSR register are stored as 0s.</p>
49 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
50 | <p>VEX.L must be 0, otherwise instructions will #UD.</p>
51 | <p>Note: In VEX-encoded versions, VEX.vvvv is reserved and must be 1111b, otherwise instructions will #UD.</p>
52 | <h2>Operation</h2>
53 | <pre>m32 ← MXCSR;</pre>
54 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
55 | <p>_mm_getcsr(void)</p>
56 | <h2>SIMD Floating-Point Exceptions</h2>
57 | <p>None.</p>
58 | <h2>Other Exceptions</h2>
59 | <p>See Exceptions Type 5; additionally</p>
60 | <table class="exception-table">
61 | <tr>
62 | <td>#UD</td>
63 | <td>
64 | <p>If VEX.L= 1,</p>
65 | <p>If VEX.vvvv ≠ 1111B.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/UD2.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>UD2—Undefined Instruction </title></head>
 8 | <body>
 9 | <h1>UD2—Undefined Instruction</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 0B</td>
20 | <td>UD2</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Raise invalid opcode exception.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Generates an invalid opcode exception. This instruction is provided for software testing to explicitly generate an invalid opcode exception. The opcode for this instruction is reserved for this purpose.</p>
41 | <p>Other than raising the invalid opcode exception, this instruction has no effect on processor state or memory.</p>
42 | <p>Even though it is the execution of the UD2 instruction that causes the invalid opcode exception, the instruction pointer saved by delivery of the exception references the UD2 instruction (and not the following instruction).</p>
43 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
44 | <h2>Operation</h2>
45 | <pre>#UD (* Generates invalid opcode exception *);</pre>
46 | <h2>Flags Affected</h2>
47 | <p>None.</p>
48 | <h2>Exceptions (All Operating Modes)</h2>
49 | <p>#UD</p>
50 | <p>Raises an invalid opcode exception in all operating modes.</p></body></html>


--------------------------------------------------------------------------------
/html/VPERM2F128.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>VPERM2F128 — Permute Floating-Point Values </title></head>
 8 | <body>
 9 | <h1>VPERM2F128 — Permute Floating-Point Values</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>VEX.NDS.256.66.0F3A.W0 06 /r ib VPERM2F128 <em>ymm1, ymm2, ymm3/m256, imm8</em></td>
19 | <td>RVMI</td>
20 | <td>V/V</td>
21 | <td>AVX</td>
22 | <td>Permute 128-bit floating-point fields in <em>ymm2 </em>and <em>ymm3/mem</em> using controls from <em>imm8</em> and store result in <em>ymm1</em>.</td></tr></table>
23 | <h3>Instruction Operand Encoding</h3>
24 | <table>
25 | <tr>
26 | <td>Op/En</td>
27 | <td>Operand 1</td>
28 | <td>Operand 2</td>
29 | <td>Operand 3</td>
30 | <td>Operand 4</td></tr>
31 | <tr>
32 | <td>RVMI</td>
33 | <td>ModRM:reg (w)</td>
34 | <td>VEX.vvvv (r)</td>
35 | <td>ModRM:r/m (r)</td>
36 | <td>imm8</td></tr></table>
37 | <h2>Description</h2>
38 | <p>Permute 128 bit floating-point-containing fields from the first source operand (second operand) and second source operand (third operand) using bits in the 8-bit immediate and store results in the destination operand (first operand). The first source operand is a YMM register, the second source operand is a YMM register or a 256-bit memory location, and the destination operand is a YMM register.</p>
39 | <p>Y1</p>
40 | <p>Y0</p>
41 | <p>SRC2</p>
42 | <p>X1</p>
43 | <p>X0</p>
44 | <p>SRC1</p>
45 | <p>X0, X1, Y0, or Y1</p>
46 | <p>DEST</p>
47 | <p>X0, X1, Y0, or Y1</p>
48 | <h3>Figure 5-21.  VPERM2F128 Operation</h3>
49 | <p>Imm8[1:0] select the source for the first destination 128-bit field, imm8[5:4] select the source for the second destination field. If imm8[3] is set, the low 128-bit field is zeroed. If imm8[7] is set, the high 128-bit field is zeroed.</p>
50 | <p>VEX.L must be 1, otherwise the instruction will #UD.</p>
51 | <h2>Operation</h2>
52 | <p><strong>VPERM2F128</strong></p>
53 | <pre>CASE IMM8[1:0] of
54 | 0: DEST[127:0] ← SRC1[127:0]
55 | 1: DEST[127:0] ← SRC1[255:128]
56 | 2: DEST[127:0] ← SRC2[127:0]
57 | 3: DEST[127:0] ← SRC2[255:128]
58 | ESAC
59 | CASE IMM8[5:4] of
60 | 0: DEST[255:128] ← SRC1[127:0]
61 | 1: DEST[255:128] ← SRC1[255:128]
62 | 2: DEST[255:128] ← SRC2[127:0]
63 | 3: DEST[255:128] ← SRC2[255:128]
64 | ESAC
65 | IF (imm8[3])
66 | DEST[127:0] ← 0
67 | FI
68 | IF (imm8[7])
69 | DEST[VLMAX-1:128] ← 0
70 | FI</pre>
71 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
72 | <p>VPERM2F128:</p>
73 | <p> __m256 _mm256_permute2f128_ps (__m256 a, __m256 b, int control)</p>
74 | <p>VPERM2F128:</p>
75 | <p> __m256d _mm256_permute2f128_pd (__m256d a, __m256d b, int control)</p>
76 | <p>VPERM2F128:</p>
77 | <p> __m256i _mm256_permute2f128_si256 (__m256i a, __m256i b, int control)</p>
78 | <h2>SIMD Floating-Point Exceptions</h2>
79 | <p>None.</p>
80 | <h2>Other Exceptions</h2>
81 | <p>See Exceptions Type 6; additionally</p>
82 | <table class="exception-table">
83 | <tr>
84 | <td>#UD</td>
85 | <td>
86 | <p>If VEX.L = 0</p>
87 | <p>If VEX.W = 1.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/VPERM2I128.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>VPERM2I128 — Permute Integer Values </title></head>
 8 | <body>
 9 | <h1>VPERM2I128 — Permute Integer Values</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 -bit Mode</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>VEX.NDS.256.66.0F3A.W0 46 /r ib</p>
20 | <p>VPERM2I128 <em>ymm1, ymm2, ymm3/m256, imm8</em></p></td>
21 | <td>RVMI</td>
22 | <td>V/V</td>
23 | <td>AVX2</td>
24 | <td>Permute 128-bit integer data in <em>ymm2</em> and <em>ymm3/mem</em> using controls from <em>imm8</em> and store result in <em>ymm1</em>.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>RVMI</td>
35 | <td>ModRM:reg (w)</td>
36 | <td>VEX.vvvv</td>
37 | <td>ModRM:r/m (r)</td>
38 | <td>Imm8</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Permute 128 bit integer data from the first source operand (second operand) and second source operand (third operand) using bits in the 8-bit immediate and store results in the destination operand (first operand). The first source operand is a YMM register, the second source operand is a YMM register or a 256-bit memory location, and the destination operand is a YMM register.</p>
41 | <p>Y1</p>
42 | <p>Y0</p>
43 | <p>SRC2</p>
44 | <p>X1</p>
45 | <p>X0</p>
46 | <p>SRC1</p>
47 | <p>X0, X1, Y0, or Y1</p>
48 | <p>DEST</p>
49 | <p>X0, X1, Y0, or Y1</p>
50 | <h3>Figure 5-22.  VPERM2I128 Operation</h3>
51 | <p>Imm8[1:0] select the source for the first destination 128-bit field, imm8[5:4] select the source for the second destination field. If imm8[3] is set, the low 128-bit field is zeroed. If imm8[7] is set, the high 128-bit field is zeroed.</p>
52 | <p>VEX.L must be 1, otherwise the instruction will #UD.</p>
53 | <h2>Operation</h2>
54 | <p><strong>VPERM2I128</strong></p>
55 | <pre>CASE IMM8[1:0] of
56 | 0: DEST[127:0] ← SRC1[127:0]
57 | 1: DEST[127:0] ← SRC1[255:128]
58 | 2: DEST[127:0] ← SRC2[127:0]
59 | 3: DEST[127:0] ← SRC2[255:128]
60 | ESAC
61 | CASE IMM8[5:4] of
62 | 0: DEST[255:128] ← SRC1[127:0]
63 | 1: DEST[255:128] ← SRC1[255:128]
64 | 2: DEST[255:128] ← SRC2[127:0]
65 | 3: DEST[255:128] ← SRC2[255:128]
66 | ESAC
67 | IF (imm8[3])
68 | DEST[127:0] ← 0
69 | FI
70 | IF (imm8[7])
71 | DEST[255:128] ← 0
72 | FI</pre>
73 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
74 | <p>VPERM2I128: __m256i _mm256_permute2x128_si256 (__m256i a, __m256i b, int control)</p>
75 | <h2>SIMD Floating-Point Exceptions</h2>
76 | <p>None</p>
77 | <h2>Other Exceptions</h2>
78 | <p>See Exceptions Type 6; additionally</p>
79 | <table class="exception-table">
80 | <tr>
81 | <td>#UD</td>
82 | <td>
83 | <p>If VEX.L = 0,</p>
84 | <p>If VEX.W = 1.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/VZEROALL.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>VZEROALL—Zero All YMM Registers </title></head>
 8 | <body>
 9 | <h1>VZEROALL—Zero All YMM Registers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>VEX.256.0F.WIG 77</p>
20 | <p>VZEROALL</p></td>
21 | <td>NP</td>
22 | <td>V/V</td>
23 | <td>AVX</td>
24 | <td>Zero all YMM registers.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>The instruction zeros contents of all XMM or YMM registers.</p>
41 | <p>Note: VEX.vvvv is reserved and must be 1111b, otherwise instructions will #UD. In Compatibility and legacy 32-bit mode only the lower 8 registers are modified.</p>
42 | <h2>Operation</h2>
43 | <p><strong>VZEROALL (VEX.256 encoded version)</strong></p>
44 | <pre>IF (64-bit mode)
45 |     YMM0[VLMAX-1:0] ← 0
46 |     YMM1[VLMAX-1:0] ← 0
47 |     YMM2[VLMAX-1:0] ← 0
48 |     YMM3[VLMAX-1:0] ← 0
49 |     YMM4[VLMAX-1:0] ← 0
50 |     YMM5[VLMAX-1:0] ← 0
51 |     YMM6[VLMAX-1:0] ← 0
52 |     YMM7[VLMAX-1:0] ← 0
53 |     YMM8[VLMAX-1:0] ← 0
54 |     YMM9[VLMAX-1:0] ← 0
55 |     YMM10[VLMAX-1:0] ← 0
56 |     YMM11[VLMAX-1:0] ← 0
57 |     YMM12[VLMAX-1:0] ← 0
58 |     YMM13[VLMAX-1:0] ← 0
59 |     YMM14[VLMAX-1:0] ← 0
60 |     YMM15[VLMAX-1:0] ← 0
61 | ELSE
62 |     YMM0[VLMAX-1:0] ← 0
63 |     YMM1[VLMAX-1:0] ← 0
64 |     YMM2[VLMAX-1:0] ← 0
65 |     YMM3[VLMAX-1:0] ← 0
66 |     YMM4[VLMAX-1:0] ← 0
67 |     YMM5[VLMAX-1:0] ← 0
68 |     YMM6[VLMAX-1:0] ← 0
69 |     YMM7[VLMAX-1:0] ← 0
70 |     YMM8-15: Unmodified
71 | FI</pre>
72 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
73 | <p>VZEROALL:</p>
74 | <p> _mm256_zeroall()</p>
75 | <h2>SIMD Floating-Point Exceptions</h2>
76 | <p>None.</p>
77 | <h2>Other Exceptions</h2>
78 | <p>See Exceptions Type 8.</p></body></html>


--------------------------------------------------------------------------------
/html/VZEROUPPER.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>VZEROUPPER—Zero Upper Bits of YMM Registers </title></head>
 8 | <body>
 9 | <h1>VZEROUPPER—Zero Upper Bits of YMM Registers</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32 bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>VEX.128.0F.WIG 77</p>
20 | <p>VZEROUPPER</p></td>
21 | <td>NP</td>
22 | <td>V/V</td>
23 | <td>AVX</td>
24 | <td>Zero upper 128 bits of all YMM registers.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>The instruction zeros the bits in position 128 and higher of all YMM registers. The lower 128-bits of the registers (the corresponding XMM registers) are unmodified.</p>
41 | <p>This instruction is recommended when transitioning between AVX and legacy SSE code - it will eliminate performance penalties caused by false dependencies.</p>
42 | <p>Note: VEX.vvvv is reserved and must be 1111b otherwise instructions will #UD. In Compatibility and legacy 32-bit mode only the lower 8 registers are modified.</p>
43 | <h2>Operation</h2>
44 | <p><strong>VZEROUPPER</strong></p>
45 | <pre>IF (64-bit mode)
46 |     YMM0[VLMAX-1:128] ← 0
47 |     YMM1[VLMAX-1:128] ← 0
48 |     YMM2[VLMAX-1:128] ← 0
49 |     YMM3[VLMAX-1:128] ← 0
50 |     YMM4[VLMAX-1:128] ← 0
51 |     YMM5[VLMAX-1:128] ← 0
52 |     YMM6[VLMAX-1:128] ← 0
53 |     YMM7[VLMAX-1:128] ← 0
54 |     YMM8[VLMAX-1:128] ← 0
55 |     YMM9[VLMAX-1:128] ← 0
56 |     YMM10[VLMAX-1:128] ← 0
57 |     YMM11[VLMAX-1:128] ← 0
58 |     YMM12[VLMAX-1:128] ← 0
59 |     YMM13[VLMAX-1:128] ← 0
60 |     YMM14[VLMAX-1:128] ← 0
61 |     YMM15[VLMAX-1:128] ← 0
62 | ELSE
63 |     YMM0[VLMAX-1:128] ← 0
64 |     YMM1[VLMAX-1:128] ← 0
65 |     YMM2[VLMAX-1:128] ← 0
66 |     YMM3[VLMAX-1:128] ← 0
67 |     YMM4[VLMAX-1:128] ← 0
68 |     YMM5[VLMAX-1:128] ← 0
69 |     YMM6[VLMAX-1:128] ← 0
70 |     YMM7[VLMAX-1:128] ← 0
71 |     YMM8-15: unmodified
72 | FI</pre>
73 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
74 | <p>VZEROUPPER:</p>
75 | <p> _mm256_zeroupper()</p>
76 | <h2>SIMD Floating-Point Exceptions</h2>
77 | <p>None.</p>
78 | <h2>Other Exceptions</h2>
79 | <p>See Exceptions Type 8.</p></body></html>


--------------------------------------------------------------------------------
/html/WAIT_FWAIT.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>WAIT/FWAIT—Wait </title></head>
 8 | <body>
 9 | <h1>WAIT/FWAIT—Wait</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64-Bit Mode</th>
16 | <th>Compat/Leg Mode</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>9B</td>
20 | <td>WAIT</td>
21 | <td>NP</td>
22 | <td>Valid</td>
23 | <td>Valid</td>
24 | <td>Check pending unmasked floating-point exceptions.</td></tr>
25 | <tr>
26 | <td>9B</td>
27 | <td>FWAIT</td>
28 | <td>NP</td>
29 | <td>Valid</td>
30 | <td>Valid</td>
31 | <td>Check pending unmasked floating-point exceptions.</td></tr></table>
32 | <h3>Instruction Operand Encoding</h3>
33 | <table>
34 | <tr>
35 | <td>Op/En</td>
36 | <td>Operand 1</td>
37 | <td>Operand 2</td>
38 | <td>Operand 3</td>
39 | <td>Operand 4</td></tr>
40 | <tr>
41 | <td>NP</td>
42 | <td>NA</td>
43 | <td>NA</td>
44 | <td>NA</td>
45 | <td>NA</td></tr></table>
46 | <h2>Description</h2>
47 | <p>Causes the processor to check for and handle pending, unmasked, floating-point exceptions before proceeding. (FWAIT is an alternate mnemonic for WAIT.)</p>
48 | <p>This instruction is useful for synchronizing exceptions in critical sections of code. Coding a WAIT instruction after a floating-point instruction ensures that any unmasked floating-point exceptions the instruction may raise are handled before the processor can modify the instruction’s results. See the section titled “Floating-Point Exception Synchronization” in Chapter 8 of the <em>Intel® 64 and IA-32 Architectures Software Developer’s Manual, Volume 1</em>, for more information on using the WAIT/FWAIT instruction.</p>
49 | <p>This instruction’s operation is the same in non-64-bit modes and 64-bit mode.</p>
50 | <h2>Operation</h2>
51 | <pre>CheckForPendingUnmaskedFloatingPointExceptions;</pre>
52 | <h2>FPU Flags Affected</h2>
53 | <p>The C0, C1, C2, and C3 flags are undefined.</p>
54 | <h2>Floating-Point Exceptions</h2>
55 | <p>None.</p>
56 | <h2>Protected Mode Exceptions</h2>
57 | <table class="exception-table">
58 | <tr>
59 | <td>#NM</td>
60 | <td>If CR0.MP[bit 1] = 1 and CR0.TS[bit 3] = 1.</td></tr>
61 | <tr>
62 | <td>#UD</td>
63 | <td>If the LOCK prefix is used.</td></tr></table>
64 | <h2>Real-Address Mode Exceptions</h2>
65 | <p>Same exceptions as in protected mode.</p>
66 | <h2>Virtual-8086 Mode Exceptions</h2>
67 | <p>Same exceptions as in protected mode.</p>
68 | <h2>Compatibility Mode Exceptions</h2>
69 | <p>Same exceptions as in protected mode.</p>
70 | <h2>64-Bit Mode Exceptions</h2>
71 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/WRPKRU.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>WRPKRU—Write Data to User Page Key Register </title></head>
 8 | <body>
 9 | <h1>WRPKRU—Write Data to User Page Key Register</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode*</th>
13 | <th>Instruction</th>
14 | <th>Op/En</th>
15 | <th>64/32bit Mode Support</th>
16 | <th>CPUID Feature Flag</th>
17 | <th>Description</th></tr>
18 | <tr>
19 | <td>0F 01 EF</td>
20 | <td>WRPKRU</td>
21 | <td>NP</td>
22 | <td>V/V</td>
23 | <td>OSPKE</td>
24 | <td>Writes EAX into PKRU.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand 2</td>
31 | <td>Operand 3</td>
32 | <td>Operand 4</td></tr>
33 | <tr>
34 | <td>NP</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>Writes the value of EAX into PKRU. ECX and EDX must be 0 when WRPKRU is executed; otherwise, a general-protection exception (#GP) occurs.</p>
41 | <p>WRPKRU can be executed only if CR4.PKE = 1; otherwise, an invalid-opcode exception (#UD) occurs. Software can discover the value of CR4.PKE by examining CPUID.(EAX=07H,ECX=0H):ECX.OSPKE [bit 4].</p>
42 | <p>On processors that support the Intel 64 Architecture, the high-order 32-bits of RCX, RDX and RAX are ignored.</p>
43 | <h2>Operation</h2>
44 | <pre>IF (ECX = 0 AND EDX = 0)
45 |     THEN PKRU ← EAX;
46 |     ELSE #GP(0);
47 | FI;</pre>
48 | <h2>Flags Affected</h2>
49 | <p>None.</p>
50 | <h2>C/C++ Compiler Intrinsic Equivalent</h2>
51 | <p>WRPKRU:</p>
52 | <p>void _wrpkru(uint32_t);</p>
53 | <h2>Protected Mode Exceptions</h2>
54 | <table class="exception-table">
55 | <tr>
56 | <td>#GP(0)</td>
57 | <td>
58 | <p>If ECX ≠ 0.</p>
59 | <p>If EDX ≠ 0.</p></td></tr>
60 | <tr>
61 | <td>#UD</td>
62 | <td>
63 | <p>If the LOCK prefix is used.</p>
64 | <p>If CR4.PKE = 0.</p></td></tr></table>
65 | <h2>Real-Address Mode Exceptions</h2>
66 | <p>Same exceptions as in protected mode.</p>
67 | <h2>Virtual-8086 Mode Exceptions</h2>
68 | <p>Same exceptions as in protected mode.</p>
69 | <h2>Compatibility Mode Exceptions</h2>
70 | <p>Same exceptions as in protected mode.</p>
71 | <h2>64-Bit Mode Exceptions</h2>
72 | <p>Same exceptions as in protected mode.</p></body></html>


--------------------------------------------------------------------------------
/html/XABORT.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>XABORT — Transactional Abort </title></head>
 8 | <body>
 9 | <h1>XABORT — Transactional Abort</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>C6 F8 ib</p>
20 | <p>XABORT imm8</p></td>
21 | <td>A</td>
22 | <td>V/V</td>
23 | <td>RTM</td>
24 | <td>Causes an RTM abort if in RTM execution</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand2</td>
31 | <td>Operand3</td>
32 | <td>Operand4</td></tr>
33 | <tr>
34 | <td>A</td>
35 | <td>imm8</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>XABORT forces an RTM abort. Following an RTM abort, the logical processor resumes execution at the fallback address computed through the outermost XBEGIN instruction. The EAX register is updated to reflect an XABORT instruction caused the abort, and the imm8 argument will be provided in bits 31:24 of EAX.</p>
41 | <h2>Operation</h2>
42 | <p><strong>XABORT</strong></p>
43 | <pre>IF RTM_ACTIVE = 0
44 |     THEN
45 |          Treat as NOP;
46 |     ELSE
47 |          GOTO RTM_ABORT_PROCESSING;
48 | FI;
49 | (* For any RTM abort condition encountered during RTM execution *)
50 | RTM_ABORT_PROCESSING:
51 |     Restore architectural register state;
52 |     Discard memory updates performed in transaction;
53 |     Update EAX with status and XABORT argument;
54 |     RTM_NEST_COUNT ← 0;
55 |     RTM_ACTIVE ← 0;
56 |     IF 64-bit Mode
57 |          THEN
58 |               RIP ← fallbackRIP;
59 |          ELSE
60 |               EIP ← fallbackEIP;
61 |     FI;
62 | END</pre>
63 | <h2>Flags Affected</h2>
64 | <p>None</p>
65 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
66 | <p>XABORT:</p>
67 | <p>void _xabort( unsigned int);</p>
68 | <h2>SIMD Floating-Point Exceptions</h2>
69 | <p>None</p>
70 | <h2>Other Exceptions</h2>
71 | <table class="exception-table">
72 | <tr>
73 | <td>#UD</td>
74 | <td>
75 | <p>CPUID.(EAX=7, ECX=0):EBX.RTM[bit 11] = 0.</p>
76 | <p>If LOCK prefix is used.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/XEND.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>XEND — Transactional End </title></head>
 8 | <body>
 9 | <h1>XEND — Transactional End</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 01 D5</p>
20 | <p>XEND</p></td>
21 | <td>A</td>
22 | <td>V/V</td>
23 | <td>RTM</td>
24 | <td>Specifies the end of an RTM code region.</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand2</td>
31 | <td>Operand3</td>
32 | <td>Operand4</td></tr>
33 | <tr>
34 | <td>A</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>The instruction marks the end of an RTM code region. If this corresponds to the outermost scope (that is, including this XEND instruction, the number of XBEGIN instructions is the same as the number of XEND instructions), the logical processor will attempt to commit the logical processor state atomically. If the commit fails, the logical processor will roll back all architectural register and memory updates performed during the RTM execution. The logical processor will resume execution at the fallback address computed from the outermost XBEGIN instruction. The EAX register is updated to reflect RTM abort information.</p>
41 | <p>XEND executed outside a transactional region will cause a #GP (General Protection Fault).</p>
42 | <h2>Operation</h2>
43 | <p><strong>XEND</strong></p>
44 | <pre>IF (RTM_ACTIVE = 0) THEN
45 |     SIGNAL #GP
46 | ELSE
47 |     RTM_NEST_COUNT--
48 |     IF (RTM_NEST_COUNT = 0) THEN
49 |          Try to commit transaction
50 |          IF fail to commit transactional execution
51 |               THEN
52 |                     GOTO RTM_ABORT_PROCESSING;
53 |               ELSE (* commit success *)
54 |                     RTM_ACTIVE ← 0
55 |          FI;
56 |     FI;
57 | FI;
58 | (* For any RTM abort condition encountered during RTM execution *)
59 | RTM_ABORT_PROCESSING:
60 |     Restore architectural register state
61 |     Discard memory updates performed in transaction
62 |     Update EAX with status
63 |     RTM_NEST_COUNT ← 0
64 |     RTM_ACTIVE ← 0
65 |     IF 64-bit Mode
66 |          THEN
67 |               RIP ← fallbackRIP
68 |          ELSE
69 |               EIP ← fallbackEIP
70 |     FI;
71 | END</pre>
72 | <h2>Flags Affected</h2>
73 | <p>None</p>
74 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
75 | <p>XEND:</p>
76 | <p>void _xend( void );</p>
77 | <h2>SIMD Floating-Point Exceptions</h2>
78 | <p>None</p>
79 | <h2>Other Exceptions</h2>
80 | <table class="exception-table">
81 | <tr>
82 | <td>#UD</td>
83 | <td>
84 | <p>CPUID.(EAX=7, ECX=0):EBX.RTM[bit 11] = 0.</p>
85 | <p>If LOCK or 66H or F2H or F3H prefix is used.</p></td></tr>
86 | <tr>
87 | <td>#GP(0)</td>
88 | <td>If RTM_ACTIVE = 0.</td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/XTEST.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | 
 3 | <html>
 4 | <head>
 5 | <meta charset="UTF-8">
 6 | <link href="style.css" type="text/css" rel="stylesheet">
 7 | <title>XTEST — Test If In Transactional Execution </title></head>
 8 | <body>
 9 | <h1>XTEST — Test If In Transactional Execution</h1>
10 | <table>
11 | <tr>
12 | <th>Opcode/Instruction</th>
13 | <th>Op/En</th>
14 | <th>64/32bit Mode Support</th>
15 | <th>CPUID Feature Flag</th>
16 | <th>Description</th></tr>
17 | <tr>
18 | <td>
19 | <p>0F 01 D6</p>
20 | <p>XTEST</p></td>
21 | <td>A</td>
22 | <td>V/V</td>
23 | <td>HLE or RTM</td>
24 | <td>Test if executing in a transactional region</td></tr></table>
25 | <h3>Instruction Operand Encoding</h3>
26 | <table>
27 | <tr>
28 | <td>Op/En</td>
29 | <td>Operand 1</td>
30 | <td>Operand2</td>
31 | <td>Operand3</td>
32 | <td>Operand4</td></tr>
33 | <tr>
34 | <td>A</td>
35 | <td>NA</td>
36 | <td>NA</td>
37 | <td>NA</td>
38 | <td>NA</td></tr></table>
39 | <h2>Description</h2>
40 | <p>The XTEST instruction queries the transactional execution status. If the instruction executes inside a transactionally executing RTM region or a transactionally executing HLE region, then the ZF flag is cleared, else it is set.</p>
41 | <h2>Operation</h2>
42 | <p><strong>XTEST</strong></p>
43 | <pre>IF (RTM_ACTIVE = 1 OR HLE_ACTIVE = 1)
44 |     THEN
45 |          ZF ← 0
46 |     ELSE
47 |          ZF ← 1
48 | FI;</pre>
49 | <h2>Flags Affected</h2>
50 | <p>The ZF flag is cleared if the instruction is executed transactionally; otherwise it is set to 1. The CF, OF, SF, PF, and AF flags are cleared.</p>
51 | <h2>Intel C/C++ Compiler Intrinsic Equivalent</h2>
52 | <p>XTEST:</p>
53 | <p>int _xtest( void );</p>
54 | <h2>SIMD Floating-Point Exceptions</h2>
55 | <p>None</p>
56 | <h2>Other Exceptions</h2>
57 | <table class="exception-table">
58 | <tr>
59 | <td>#UD</td>
60 | <td>
61 | <p>CPUID.(EAX=7, ECX=0):EBX.HLE[bit 4] = 0 and CPUID.(EAX=7, ECX=0):EBX.RTM[bit 11] = 0.</p>
62 | <p>If LOCK or 66H or F2H or F3H prefix is used.</p></td></tr></table></body></html>


--------------------------------------------------------------------------------
/html/style.css:
--------------------------------------------------------------------------------
1 | table { border-collapse: collapse }
2 | th, td { padding: 0px 10px; border: 1px #ddd solid; vertical-align: top }
3 | svg { display: block; margin: 0px auto }
4 | svg + h3 { text-align: center; }
5 | 
6 | table.opcodes { font: 10pt "Courier New", monospace; }
7 | 
8 | .notes { font-size: 9pt; }
9 | 


--------------------------------------------------------------------------------
/parsejson.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python
 2 | # -*- coding: UTF-8 -*-
 3 | 
 4 | import sys
 5 | try:
 6 | 	import ujson as json
 7 | except ImportError:
 8 | 	import json
 9 | from htmltext import *
10 | 
def main(argv):
	"""Render each opcode JSON file named in argv[1:] as an HTML table.

	Each input file is parsed as JSON and iterated as a sequence of records;
	every record is indexed by the keys "Opcode", "Instruction" and
	"Description", one table cell per key. The page is written to the fixed
	path "html/_opcodes.html", so when several inputs are given each one
	overwrites the output of the previous one.

	argv -- full argument vector; argv[0] (the program name) is skipped.

	Returns None, so ``sys.exit(main(...))`` exits with status 0. Errors
	from opening files, parsing JSON or looking up a missing column in a
	record are not caught and propagate to the caller.
	"""
	columns = ["Opcode", "Instruction", "Description"]
	title = u"x86"

	for arg in argv[1:]:
		# Only the parse needs the input handle; release it before rendering.
		with open(arg, "rb") as f:
			opcodes = json.loads(f.read())

		text = HtmlText()
		text.append(OpenTag("html"))
		text.append(OpenTag("head"))
		text.append(OpenTag("meta", attributes={"charset": "UTF-8"}, self_closes=True))
		text.append(OpenTag("link", attributes={"rel": "stylesheet", "type": "text/css", "href": "style.css"}, self_closes=True))
		text.append(OpenTag("title"))
		text.append(title)
		text.append(CloseTag("title"))
		text.append(CloseTag("head"))
		text.append(OpenTag("body"))

		text.append(OpenTag("table", attributes={"class": "opcodes"}))

		# Header row: one <th> per column name.
		text.append(OpenTag("tr"))
		for column in columns:
			text.append(OpenTag("th"))
			text.append(column)
			text.append(CloseTag("th"))
		text.append(CloseTag("tr"))

		# Body rows: one <tr> per record, cells in the same column order.
		for opcode in opcodes:
			text.append(OpenTag("tr"))
			for column in columns:
				text.append(OpenTag("td"))
				text.append(opcode[column])
				text.append(CloseTag("td"))
			text.append(CloseTag("tr"))

		text.append(CloseTag("table"))
		# NOTE(review): no CloseTag for "body"/"html" is appended; presumably
		# HtmlText.to_html() closes them or the omission is intentional -- confirm.

		# Build the page as text first and encode once. Concatenating a str
		# literal with the already-encoded bytes raises TypeError on Python 3.
		# Non-ASCII characters become numeric character references.
		page = u"<!DOCTYPE html>\n" + text.to_html()
		with open("html/_opcodes.html", "wb") as g:
			g.write(page.encode('ascii', 'xmlcharrefreplace'))
54 | 
55 | 
if __name__ == "__main__":
	# Script entry point: forward the full argument vector to main() and use
	# whatever it returns as the process exit status.
	sys.exit(main(sys.argv))
59 | 


--------------------------------------------------------------------------------