Browse Source

Add x86 instruction sets FP16, BF16, 4VNNIW, 4FMAPS. Small updates.

Margers 2 months ago
parent
commit
cca0c2e111

+ 180 - 6
compiler/i386/i386att.inc

@@ -968,7 +968,6 @@
 'vpermilps',
 'vpermilps',
 'vpextrb',
 'vpextrb',
 'vpextrd',
 'vpextrd',
-'vpextrq',
 'vpextrw',
 'vpextrw',
 'vphaddd',
 'vphaddd',
 'vphaddsw',
 'vphaddsw',
@@ -979,7 +978,6 @@
 'vphsubw',
 'vphsubw',
 'vpinsrb',
 'vpinsrb',
 'vpinsrd',
 'vpinsrd',
-'vpinsrq',
 'vpinsrw',
 'vpinsrw',
 'vpmaddubsw',
 'vpmaddubsw',
 'vpmaddwd',
 'vpmaddwd',
@@ -1199,11 +1197,8 @@
 'xgetbv',
 'xgetbv',
 'xsetbv',
 'xsetbv',
 'xsave',
 'xsave',
-'xsave64',
 'xrstor',
 'xrstor',
-'xrstor64',
 'xsaveopt',
 'xsaveopt',
-'xsaveopt64',
 'prefetchwt1',
 'prefetchwt1',
 'kaddb',
 'kaddb',
 'kaddd',
 'kaddd',
@@ -1573,6 +1568,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 179 - 5
compiler/i386/i386atts.inc

@@ -1095,8 +1095,6 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
-attsufNONE,
-attsufNONE,
 attsufINT,
 attsufINT,
 attsufINT,
 attsufINT,
 attsufNONE,
 attsufNONE,
@@ -1201,9 +1199,6 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
-attsufNONE,
-attsufNONE,
-attsufNONE,
 attsufINT,
 attsufINT,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
@@ -1574,5 +1569,184 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
+attsufMMX,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
 attsufNONE
 attsufNONE
 );
 );

+ 180 - 6
compiler/i386/i386int.inc

@@ -968,7 +968,6 @@
 'vpermilps',
 'vpermilps',
 'vpextrb',
 'vpextrb',
 'vpextrd',
 'vpextrd',
-'vpextrq',
 'vpextrw',
 'vpextrw',
 'vphaddd',
 'vphaddd',
 'vphaddsw',
 'vphaddsw',
@@ -979,7 +978,6 @@
 'vphsubw',
 'vphsubw',
 'vpinsrb',
 'vpinsrb',
 'vpinsrd',
 'vpinsrd',
-'vpinsrq',
 'vpinsrw',
 'vpinsrw',
 'vpmaddubsw',
 'vpmaddubsw',
 'vpmaddwd',
 'vpmaddwd',
@@ -1199,11 +1197,8 @@
 'xgetbv',
 'xgetbv',
 'xsetbv',
 'xsetbv',
 'xsave',
 'xsave',
-'xsave64',
 'xrstor',
 'xrstor',
-'xrstor64',
 'xsaveopt',
 'xsaveopt',
-'xsaveopt64',
 'prefetchwt1',
 'prefetchwt1',
 'kaddb',
 'kaddb',
 'kaddd',
 'kaddd',
@@ -1573,6 +1568,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 1 - 1
compiler/i386/i386nop.inc

@@ -1,2 +1,2 @@
 { don't edit, this file is generated from x86ins.dat }
 { don't edit, this file is generated from x86ins.dat }
-5111;
+5980;

+ 180 - 6
compiler/i386/i386op.inc

@@ -968,7 +968,6 @@ A_VPERMILPD,
 A_VPERMILPS,
 A_VPERMILPS,
 A_VPEXTRB,
 A_VPEXTRB,
 A_VPEXTRD,
 A_VPEXTRD,
-A_VPEXTRQ,
 A_VPEXTRW,
 A_VPEXTRW,
 A_VPHADDD,
 A_VPHADDD,
 A_VPHADDSW,
 A_VPHADDSW,
@@ -979,7 +978,6 @@ A_VPHSUBSW,
 A_VPHSUBW,
 A_VPHSUBW,
 A_VPINSRB,
 A_VPINSRB,
 A_VPINSRD,
 A_VPINSRD,
-A_VPINSRQ,
 A_VPINSRW,
 A_VPINSRW,
 A_VPMADDUBSW,
 A_VPMADDUBSW,
 A_VPMADDWD,
 A_VPMADDWD,
@@ -1199,11 +1197,8 @@ A_RDSEED,
 A_XGETBV,
 A_XGETBV,
 A_XSETBV,
 A_XSETBV,
 A_XSAVE,
 A_XSAVE,
-A_XSAVE64,
 A_XRSTOR,
 A_XRSTOR,
-A_XRSTOR64,
 A_XSAVEOPT,
 A_XSAVEOPT,
-A_XSAVEOPT64,
 A_PREFETCHWT1,
 A_PREFETCHWT1,
 A_KADDB,
 A_KADDB,
 A_KADDD,
 A_KADDD,
@@ -1573,6 +1568,185 @@ A_VGF2P8MULB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEQB,
 A_GF2P8AFFINEQB,
 A_GF2P8MULB,
 A_GF2P8MULB,
+A_VCVTNE2PS2BF16,
+A_VCVTNEPS2BF16,
+A_VDPBF16PS,
+A_V4FMADDPS,
+A_V4FMADDSS,
+A_V4FNMADDPS,
+A_V4FNMADDSS,
+A_VP4DPWSSD,
+A_VP4DPWSSDS,
 A_VP2INTERSECTD,
 A_VP2INTERSECTD,
-A_VP2INTERSECTQ
+A_VP2INTERSECTQ,
+A_VMOVW,
+A_VMOVSH,
+A_VADDPH,
+A_VADDSH,
+A_VCMPEQPH,
+A_VCMPLTPH,
+A_VCMPLEPH,
+A_VCMPUNORDPH,
+A_VCMPNEQPH,
+A_VCMPNLTPH,
+A_VCMPNLEPH,
+A_VCMPORDPH,
+A_VCMPEQ_UQPH,
+A_VCMPNGEPH,
+A_VCMPNGTPH,
+A_VCMPFALSEPH,
+A_VCMPNEQ_OQPH,
+A_VCMPGEPH,
+A_VCMPGTPH,
+A_VCMPTRUEPH,
+A_VCMPEQ_OSPH,
+A_VCMPLT_OQPH,
+A_VCMPLE_OQPH,
+A_VCMPUNORD_SPH,
+A_VCMPNEQ_USPH,
+A_VCMPNLT_UQPH,
+A_VCMPNLE_UQPH,
+A_VCMPORD_SPH,
+A_VCMPEQ_USPH,
+A_VCMPNGE_UQPH,
+A_VCMPNGT_UQPH,
+A_VCMPFALSE_OSPH,
+A_VCMPNEQ_OSPH,
+A_VCMPGE_OQPH,
+A_VCMPGT_OQPH,
+A_VCMPTRUE_USPH,
+A_VCMPEQSH,
+A_VCMPLTSH,
+A_VCMPLESH,
+A_VCMPUNORDSH,
+A_VCMPNEQSH,
+A_VCMPNLTSH,
+A_VCMPNLESH,
+A_VCMPORDSH,
+A_VCMPEQ_UQSH,
+A_VCMPNGESH,
+A_VCMPNGTSH,
+A_VCMPFALSESH,
+A_VCMPNEQ_OQSH,
+A_VCMPGESH,
+A_VCMPGTSH,
+A_VCMPTRUESH,
+A_VCMPEQ_OSSH,
+A_VCMPLT_OQSH,
+A_VCMPLE_OQSH,
+A_VCMPUNORD_SSH,
+A_VCMPNEQ_USSH,
+A_VCMPNLT_UQSH,
+A_VCMPNLE_UQSH,
+A_VCMPORD_SSH,
+A_VCMPEQ_USSH,
+A_VCMPNGE_UQSH,
+A_VCMPNGT_UQSH,
+A_VCMPFALSE_OSSH,
+A_VCMPNEQ_OSSH,
+A_VCMPGE_OQSH,
+A_VCMPGT_OQSH,
+A_VCMPTRUE_USSH,
+A_VCMPPH,
+A_VCMPSH,
+A_VCOMISH,
+A_VCVTDQ2PH,
+A_VCVTPD2PH,
+A_VCVTPH2DQ,
+A_VCVTPH2PD,
+A_VCVTPH2PSX,
+A_VCVTPH2QQ,
+A_VCVTPH2UDQ,
+A_VCVTPH2UQQ,
+A_VCVTPH2UW,
+A_VCVTPH2W,
+A_VCVTPS2PHX,
+A_VCVTQQ2PH,
+A_VCVTSD2SH,
+A_VCVTSH2SD,
+A_VCVTSH2SI,
+A_VCVTSH2SS,
+A_VCVTSH2USI,
+A_VCVTSI2SH,
+A_VCVTSS2SH,
+A_VCVTTPH2DQ,
+A_VCVTTPH2QQ,
+A_VCVTTPH2UDQ,
+A_VCVTTPH2UQQ,
+A_VCVTTPH2UW,
+A_VCVTTPH2W,
+A_VCVTTSH2SI,
+A_VCVTTSH2USI,
+A_VCVTUDQ2PH,
+A_VCVTUQQ2PH,
+A_VCVTUSI2SH,
+A_VCVTUW2PH,
+A_VCVTW2PH,
+A_VDIVPH,
+A_VDIVSH,
+A_VFCMADDCPH,
+A_VFCMADDCSH,
+A_VFMADDCPH,
+A_VFMADDCSH,
+A_VFCMULCPH,
+A_VFCMULCSH,
+A_VFMULCPH,
+A_VFMULCSH,
+A_VFMADDSUB132PH,
+A_VFMADDSUB213PH,
+A_VFMADDSUB231PH,
+A_VFMSUBADD132PH,
+A_VFMSUBADD213PH,
+A_VFMSUBADD231PH,
+A_VFMADD132PH,
+A_VFMADD213PH,
+A_VFMADD231PH,
+A_VFNMADD132PH,
+A_VFNMADD213PH,
+A_VFNMADD231PH,
+A_VFMADD132SH,
+A_VFMADD213SH,
+A_VFMADD231SH,
+A_VFNMADD132SH,
+A_VFNMADD213SH,
+A_VFNMADD231SH,
+A_VFMSUB132PH,
+A_VFMSUB213PH,
+A_VFMSUB231PH,
+A_VFNMSUB132PH,
+A_VFNMSUB213PH,
+A_VFNMSUB231PH,
+A_VFMSUB132SH,
+A_VFMSUB213SH,
+A_VFMSUB231SH,
+A_VFNMSUB132SH,
+A_VFNMSUB213SH,
+A_VFNMSUB231SH,
+A_VFPCLASSPH,
+A_VFPCLASSSH,
+A_VGETEXPPH,
+A_VGETEXPSH,
+A_VGETMANTPH,
+A_VGETMANTSH,
+A_VMAXPH,
+A_VMAXSH,
+A_VMINPH,
+A_VMINSH,
+A_VMULPH,
+A_VMULSH,
+A_VRCPPH,
+A_VRCPSH,
+A_VREDUCEPH,
+A_VREDUCESH,
+A_VRNDSCALEPH,
+A_VRNDSCALESH,
+A_VRSQRTPH,
+A_VRSQRTSH,
+A_VSCALEFPH,
+A_VSCALEFSH,
+A_VSQRTPH,
+A_VSQRTSH,
+A_VSUBPH,
+A_VSUBSH,
+A_VUCOMISH
 );
 );

+ 180 - 6
compiler/i386/i386prop.inc

@@ -969,7 +969,6 @@
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
-(Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -980,7 +979,6 @@
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
-(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -1202,9 +1200,6 @@
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
-(Ch: [Ch_All]),
-(Ch: [Ch_All]),
-(Ch: [Ch_All]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -1574,5 +1569,184 @@
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
-(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1])
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1])
 );
 );

File diff suppressed because it is too large
+ 224 - 133
compiler/i386/i386tab.inc


+ 180 - 6
compiler/i8086/i8086att.inc

@@ -968,7 +968,6 @@
 'vpermilps',
 'vpermilps',
 'vpextrb',
 'vpextrb',
 'vpextrd',
 'vpextrd',
-'vpextrq',
 'vpextrw',
 'vpextrw',
 'vphaddd',
 'vphaddd',
 'vphaddsw',
 'vphaddsw',
@@ -979,7 +978,6 @@
 'vphsubw',
 'vphsubw',
 'vpinsrb',
 'vpinsrb',
 'vpinsrd',
 'vpinsrd',
-'vpinsrq',
 'vpinsrw',
 'vpinsrw',
 'vpmaddubsw',
 'vpmaddubsw',
 'vpmaddwd',
 'vpmaddwd',
@@ -1213,11 +1211,8 @@
 'xgetbv',
 'xgetbv',
 'xsetbv',
 'xsetbv',
 'xsave',
 'xsave',
-'xsave64',
 'xrstor',
 'xrstor',
-'xrstor64',
 'xsaveopt',
 'xsaveopt',
-'xsaveopt64',
 'prefetchwt1',
 'prefetchwt1',
 'kaddb',
 'kaddb',
 'kaddd',
 'kaddd',
@@ -1587,6 +1582,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 179 - 5
compiler/i8086/i8086atts.inc

@@ -1095,8 +1095,6 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
-attsufNONE,
-attsufNONE,
 attsufINT,
 attsufINT,
 attsufINT,
 attsufINT,
 attsufNONE,
 attsufNONE,
@@ -1215,9 +1213,6 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
-attsufNONE,
-attsufNONE,
-attsufNONE,
 attsufINT,
 attsufINT,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
@@ -1588,5 +1583,184 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
+attsufMMX,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
 attsufNONE
 attsufNONE
 );
 );

+ 180 - 6
compiler/i8086/i8086int.inc

@@ -968,7 +968,6 @@
 'vpermilps',
 'vpermilps',
 'vpextrb',
 'vpextrb',
 'vpextrd',
 'vpextrd',
-'vpextrq',
 'vpextrw',
 'vpextrw',
 'vphaddd',
 'vphaddd',
 'vphaddsw',
 'vphaddsw',
@@ -979,7 +978,6 @@
 'vphsubw',
 'vphsubw',
 'vpinsrb',
 'vpinsrb',
 'vpinsrd',
 'vpinsrd',
-'vpinsrq',
 'vpinsrw',
 'vpinsrw',
 'vpmaddubsw',
 'vpmaddubsw',
 'vpmaddwd',
 'vpmaddwd',
@@ -1213,11 +1211,8 @@
 'xgetbv',
 'xgetbv',
 'xsetbv',
 'xsetbv',
 'xsave',
 'xsave',
-'xsave64',
 'xrstor',
 'xrstor',
-'xrstor64',
 'xsaveopt',
 'xsaveopt',
-'xsaveopt64',
 'prefetchwt1',
 'prefetchwt1',
 'kaddb',
 'kaddb',
 'kaddd',
 'kaddd',
@@ -1587,6 +1582,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 1 - 1
compiler/i8086/i8086nop.inc

@@ -1,2 +1,2 @@
 { don't edit, this file is generated from x86ins.dat }
 { don't edit, this file is generated from x86ins.dat }
-5143;
+6012;

+ 180 - 6
compiler/i8086/i8086op.inc

@@ -968,7 +968,6 @@ A_VPERMILPD,
 A_VPERMILPS,
 A_VPERMILPS,
 A_VPEXTRB,
 A_VPEXTRB,
 A_VPEXTRD,
 A_VPEXTRD,
-A_VPEXTRQ,
 A_VPEXTRW,
 A_VPEXTRW,
 A_VPHADDD,
 A_VPHADDD,
 A_VPHADDSW,
 A_VPHADDSW,
@@ -979,7 +978,6 @@ A_VPHSUBSW,
 A_VPHSUBW,
 A_VPHSUBW,
 A_VPINSRB,
 A_VPINSRB,
 A_VPINSRD,
 A_VPINSRD,
-A_VPINSRQ,
 A_VPINSRW,
 A_VPINSRW,
 A_VPMADDUBSW,
 A_VPMADDUBSW,
 A_VPMADDWD,
 A_VPMADDWD,
@@ -1213,11 +1211,8 @@ A_RDSEED,
 A_XGETBV,
 A_XGETBV,
 A_XSETBV,
 A_XSETBV,
 A_XSAVE,
 A_XSAVE,
-A_XSAVE64,
 A_XRSTOR,
 A_XRSTOR,
-A_XRSTOR64,
 A_XSAVEOPT,
 A_XSAVEOPT,
-A_XSAVEOPT64,
 A_PREFETCHWT1,
 A_PREFETCHWT1,
 A_KADDB,
 A_KADDB,
 A_KADDD,
 A_KADDD,
@@ -1587,6 +1582,185 @@ A_VGF2P8MULB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEQB,
 A_GF2P8AFFINEQB,
 A_GF2P8MULB,
 A_GF2P8MULB,
+A_VCVTNE2PS2BF16,
+A_VCVTNEPS2BF16,
+A_VDPBF16PS,
+A_V4FMADDPS,
+A_V4FMADDSS,
+A_V4FNMADDPS,
+A_V4FNMADDSS,
+A_VP4DPWSSD,
+A_VP4DPWSSDS,
 A_VP2INTERSECTD,
 A_VP2INTERSECTD,
-A_VP2INTERSECTQ
+A_VP2INTERSECTQ,
+A_VMOVW,
+A_VMOVSH,
+A_VADDPH,
+A_VADDSH,
+A_VCMPEQPH,
+A_VCMPLTPH,
+A_VCMPLEPH,
+A_VCMPUNORDPH,
+A_VCMPNEQPH,
+A_VCMPNLTPH,
+A_VCMPNLEPH,
+A_VCMPORDPH,
+A_VCMPEQ_UQPH,
+A_VCMPNGEPH,
+A_VCMPNGTPH,
+A_VCMPFALSEPH,
+A_VCMPNEQ_OQPH,
+A_VCMPGEPH,
+A_VCMPGTPH,
+A_VCMPTRUEPH,
+A_VCMPEQ_OSPH,
+A_VCMPLT_OQPH,
+A_VCMPLE_OQPH,
+A_VCMPUNORD_SPH,
+A_VCMPNEQ_USPH,
+A_VCMPNLT_UQPH,
+A_VCMPNLE_UQPH,
+A_VCMPORD_SPH,
+A_VCMPEQ_USPH,
+A_VCMPNGE_UQPH,
+A_VCMPNGT_UQPH,
+A_VCMPFALSE_OSPH,
+A_VCMPNEQ_OSPH,
+A_VCMPGE_OQPH,
+A_VCMPGT_OQPH,
+A_VCMPTRUE_USPH,
+A_VCMPEQSH,
+A_VCMPLTSH,
+A_VCMPLESH,
+A_VCMPUNORDSH,
+A_VCMPNEQSH,
+A_VCMPNLTSH,
+A_VCMPNLESH,
+A_VCMPORDSH,
+A_VCMPEQ_UQSH,
+A_VCMPNGESH,
+A_VCMPNGTSH,
+A_VCMPFALSESH,
+A_VCMPNEQ_OQSH,
+A_VCMPGESH,
+A_VCMPGTSH,
+A_VCMPTRUESH,
+A_VCMPEQ_OSSH,
+A_VCMPLT_OQSH,
+A_VCMPLE_OQSH,
+A_VCMPUNORD_SSH,
+A_VCMPNEQ_USSH,
+A_VCMPNLT_UQSH,
+A_VCMPNLE_UQSH,
+A_VCMPORD_SSH,
+A_VCMPEQ_USSH,
+A_VCMPNGE_UQSH,
+A_VCMPNGT_UQSH,
+A_VCMPFALSE_OSSH,
+A_VCMPNEQ_OSSH,
+A_VCMPGE_OQSH,
+A_VCMPGT_OQSH,
+A_VCMPTRUE_USSH,
+A_VCMPPH,
+A_VCMPSH,
+A_VCOMISH,
+A_VCVTDQ2PH,
+A_VCVTPD2PH,
+A_VCVTPH2DQ,
+A_VCVTPH2PD,
+A_VCVTPH2PSX,
+A_VCVTPH2QQ,
+A_VCVTPH2UDQ,
+A_VCVTPH2UQQ,
+A_VCVTPH2UW,
+A_VCVTPH2W,
+A_VCVTPS2PHX,
+A_VCVTQQ2PH,
+A_VCVTSD2SH,
+A_VCVTSH2SD,
+A_VCVTSH2SI,
+A_VCVTSH2SS,
+A_VCVTSH2USI,
+A_VCVTSI2SH,
+A_VCVTSS2SH,
+A_VCVTTPH2DQ,
+A_VCVTTPH2QQ,
+A_VCVTTPH2UDQ,
+A_VCVTTPH2UQQ,
+A_VCVTTPH2UW,
+A_VCVTTPH2W,
+A_VCVTTSH2SI,
+A_VCVTTSH2USI,
+A_VCVTUDQ2PH,
+A_VCVTUQQ2PH,
+A_VCVTUSI2SH,
+A_VCVTUW2PH,
+A_VCVTW2PH,
+A_VDIVPH,
+A_VDIVSH,
+A_VFCMADDCPH,
+A_VFCMADDCSH,
+A_VFMADDCPH,
+A_VFMADDCSH,
+A_VFCMULCPH,
+A_VFCMULCSH,
+A_VFMULCPH,
+A_VFMULCSH,
+A_VFMADDSUB132PH,
+A_VFMADDSUB213PH,
+A_VFMADDSUB231PH,
+A_VFMSUBADD132PH,
+A_VFMSUBADD213PH,
+A_VFMSUBADD231PH,
+A_VFMADD132PH,
+A_VFMADD213PH,
+A_VFMADD231PH,
+A_VFNMADD132PH,
+A_VFNMADD213PH,
+A_VFNMADD231PH,
+A_VFMADD132SH,
+A_VFMADD213SH,
+A_VFMADD231SH,
+A_VFNMADD132SH,
+A_VFNMADD213SH,
+A_VFNMADD231SH,
+A_VFMSUB132PH,
+A_VFMSUB213PH,
+A_VFMSUB231PH,
+A_VFNMSUB132PH,
+A_VFNMSUB213PH,
+A_VFNMSUB231PH,
+A_VFMSUB132SH,
+A_VFMSUB213SH,
+A_VFMSUB231SH,
+A_VFNMSUB132SH,
+A_VFNMSUB213SH,
+A_VFNMSUB231SH,
+A_VFPCLASSPH,
+A_VFPCLASSSH,
+A_VGETEXPPH,
+A_VGETEXPSH,
+A_VGETMANTPH,
+A_VGETMANTSH,
+A_VMAXPH,
+A_VMAXSH,
+A_VMINPH,
+A_VMINSH,
+A_VMULPH,
+A_VMULSH,
+A_VRCPPH,
+A_VRCPSH,
+A_VREDUCEPH,
+A_VREDUCESH,
+A_VRNDSCALEPH,
+A_VRNDSCALESH,
+A_VRSQRTPH,
+A_VRSQRTSH,
+A_VSCALEFPH,
+A_VSCALEFSH,
+A_VSQRTPH,
+A_VSQRTSH,
+A_VSUBPH,
+A_VSUBSH,
+A_VUCOMISH
 );
 );

+ 180 - 6
compiler/i8086/i8086prop.inc

@@ -969,7 +969,6 @@
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2]),
-(Ch: [Ch_Wop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -980,7 +979,6 @@
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
-(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -1216,9 +1214,6 @@
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
 (Ch: [Ch_All]),
-(Ch: [Ch_All]),
-(Ch: [Ch_All]),
-(Ch: [Ch_All]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
@@ -1588,5 +1583,184 @@
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
-(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1])
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1])
 );
 );

File diff suppressed because it is too large
+ 224 - 133
compiler/i8086/i8086tab.inc


+ 12 - 0
compiler/x86/aasmcpu.pas

@@ -5618,6 +5618,18 @@ implementation
                      (AsmOp = A_VCVTUSI2SD) or
                      (AsmOp = A_VCVTUSI2SD) or
                      (AsmOp = A_VCVTUSI2SS) or
                      (AsmOp = A_VCVTUSI2SS) or
 
 
+                     (AsmOp = A_vcvtdq2ph) or
+                     (AsmOp = A_vcvtpd2ph) or
+                     (AsmOp = A_vcvtph2pd) or
+                     (AsmOp = A_vcvtqq2ph) or
+                     (AsmOp = A_vcvtsi2sh) or
+                     (AsmOp = A_vcvttph2qq) or
+                     (AsmOp = A_vcvttph2uqq) or
+                     (AsmOp = A_vcvtudq2ph) or
+                     (AsmOp = A_vcvtuqq2ph) or
+                     (AsmOp = A_vcvtusi2sh) or
+                     (AsmOp = A_VCVTNEPS2BF16) or
+                     (AsmOp = A_vcvtps2phx) or
 
 
                      // TODO check
                      // TODO check
                      (AsmOp = A_VCMPSS)
                      (AsmOp = A_VCMPSS)

+ 1562 - 103
compiler/x86/x86ins.dat

@@ -5120,18 +5120,18 @@ xmmreg_mz,xmmreg,xmmreg_er                \334\350\352\362\370\1\x5A\75\120
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 [VCVTSI2SD,vcvtsi2sdS]
 [VCVTSI2SD,vcvtsi2sdS]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmmreg_er,reg32                    \334\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE
+xmmreg,xmmreg,reg32                       \334\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE
 xmmreg,xmmreg_er,reg64                    \334\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,X86_64
 xmmreg,xmmreg_er,reg64                    \334\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,X86_64
-xmmreg,xmmreg_er,mem32                    \334\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE,T1S
-xmmreg,xmmreg_er,mem64                    \334\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,T1S
+xmmreg,xmmreg,mem32                       \334\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE,T1S
+xmmreg,xmmreg,mem64                       \334\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,T1S
 
 
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 [VCVTSI2SS,vcvtsi2ssS]
 [VCVTSI2SS,vcvtsi2ssS]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 xmmreg,xmmreg_er,reg32                    \333\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE
 xmmreg,xmmreg_er,reg32                    \333\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE
 xmmreg,xmmreg_er,reg64                    \333\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,X86_64
 xmmreg,xmmreg_er,reg64                    \333\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,X86_64
-xmmreg,xmmreg_er,mem32                    \333\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE,T1S
-xmmreg,xmmreg_er,mem64                    \333\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,T1S
+xmmreg,xmmreg,mem32                       \333\350\362\370\1\x2A\75\120             AVX,SANDYBRIDGE,T1S
+xmmreg,xmmreg,mem64                       \333\350\352\362\363\370\1\x2A\75\120     AVX,SANDYBRIDGE,T1S
 
 
 [VCVTSS2SD]
 [VCVTSS2SD]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
@@ -5348,9 +5348,9 @@ xmmreg_mz,xmmreg,xmmreg_sae               \333\350\362\370\1\x5D\75\120
 
 
 [VMOVAPD]
 [VMOVAPD]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
-xmmrm_mz,xmmreg                           \350\352\361\362\370\1\x29\101            AVX,SANDYBRIDGE,TFVM
-ymmrm_mz,ymmreg                           \350\352\361\362\364\370\1\x29\101        AVX,SANDYBRIDGE,TFVM
 zmmrm_mz,zmmreg                           \350\351\352\361\370\1\x29\101            AVX512,TFVM
 zmmrm_mz,zmmreg                           \350\351\352\361\370\1\x29\101            AVX512,TFVM
+ymmrm_mz,ymmreg                           \350\352\361\362\364\370\1\x29\101        AVX,SANDYBRIDGE,TFVM
+xmmrm_mz,xmmreg                           \350\352\361\362\370\1\x29\101            AVX,SANDYBRIDGE,TFVM
 xmmreg_mz,xmmrm                           \350\352\361\362\370\1\x28\110            AVX,SANDYBRIDGE,TFVM
 xmmreg_mz,xmmrm                           \350\352\361\362\370\1\x28\110            AVX,SANDYBRIDGE,TFVM
 ymmreg_mz,ymmrm                           \350\352\361\362\364\370\1\x28\110        AVX,SANDYBRIDGE,TFVM
 ymmreg_mz,ymmrm                           \350\352\361\362\364\370\1\x28\110        AVX,SANDYBRIDGE,TFVM
 zmmreg_mz,zmmrm                           \350\351\352\361\370\1\x28\110            AVX512,TFVM
 zmmreg_mz,zmmrm                           \350\351\352\361\370\1\x28\110            AVX512,TFVM
@@ -5949,7 +5949,7 @@ rm32,xmmreg,imm8                          \350\361\362\372\1\x16\101\26
 
 
 [VPEXTRQ]
 [VPEXTRQ]
 (Ch_Wop3, Ch_Rop2)
 (Ch_Wop3, Ch_Rop2)
-rm64,xmmreg,imm8                          \350\352\361\362\363\372\1\x16\101\26     AVX,SANDYBRIDGE,T1S
+rm64,xmmreg,imm8                          \350\352\361\362\363\372\1\x16\101\26     AVX,SANDYBRIDGE,T1S,X86_64
 
 
 
 
 [VPEXTRW]
 [VPEXTRW]
@@ -6010,7 +6010,7 @@ xmmreg,xmmreg,rm32,imm8                   \350\361\362\372\1\x22\75\120\27
 
 
 [VPINSRQ]
 [VPINSRQ]
 (Ch_Wop4, Ch_Rop3, Ch_Rop2)
 (Ch_Wop4, Ch_Rop3, Ch_Rop2)
-xmmreg,xmmreg,rm64,imm8                   \350\352\361\362\363\372\1\x22\75\120\27  AVX,SANDYBRIDGE,T1S
+xmmreg,xmmreg,rm64,imm8                   \350\352\361\362\363\372\1\x22\75\120\27  AVX,SANDYBRIDGE,T1S,X86_64
 
 
 
 
 [VPINSRW]
 [VPINSRW]
@@ -7141,73 +7141,73 @@ zmmreg_mz,zmmreg,bmem64                   \350\351\352\361\371\1\x45\75\120
 
 
 [VGATHERDPD]
 [VGATHERDPD]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem32,xmmreg                      \361\362\363\371\1\x92\76\110             AVX2
-xmmreg_m,xmem32                           \350\352\361\371\1\x92\110                AVX512,T1S
-ymmreg,xmem32,ymmreg                      \361\362\363\364\371\1\x92\76\110         AVX2        I
-ymmreg_m,xmem32                           \350\352\361\364\371\1\x92\110            AVX512,T1S
-zmmreg_m,ymem32                           \350\351\352\361\371\1\x92\110            AVX512,T1S
+xmmreg,xmem32,xmmreg                      \361\362\363\371\1\x92\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem32                           \350\352\361\371\1\x92\110                AVX512,T1S,DISTINCT,DALL
+ymmreg,xmem32,ymmreg                      \361\362\363\364\371\1\x92\76\110         AVX2,DISTINCT,DALL
+ymmreg_m,xmem32                           \350\352\361\364\371\1\x92\110            AVX512,T1S,DISTINCT,DALL
+zmmreg_m,ymem32                           \350\351\352\361\371\1\x92\110            AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VGATHERDPS]
 [VGATHERDPS]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem32,xmmreg                      \361\362\371\1\x92\76\110                 AVX2
-xmmreg_m,xmem32                           \350\361\371\1\x92\110                    AVX512,T1S
-ymmreg,ymem32,ymmreg                      \361\362\364\371\1\x92\76\110             AVX2
-ymmreg_m,ymem32                           \350\361\364\371\1\x92\110                AVX512,T1S
-zmmreg_m,zmem32                           \350\351\361\371\1\x92\110                AVX512,T1S
+xmmreg,xmem32,xmmreg                      \361\362\371\1\x92\76\110                 AVX2,DISTINCT,DALL
+xmmreg_m,xmem32                           \350\361\371\1\x92\110                    AVX512,T1S,DISTINCT,DALL
+ymmreg,ymem32,ymmreg                      \361\362\364\371\1\x92\76\110             AVX2,DISTINCT,DALL
+ymmreg_m,ymem32                           \350\361\364\371\1\x92\110                AVX512,T1S,DISTINCT,DALL
+zmmreg_m,zmem32                           \350\351\361\371\1\x92\110                AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VGATHERQPD]
 [VGATHERQPD]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x93\76\110             AVX2
-xmmreg_m,xmem64                           \350\352\361\371\1\x93\110                AVX512,T1S
-ymmreg,ymem64,ymmreg                      \361\362\363\364\371\1\x93\76\110         AVX2
-ymmreg_m,ymem64                           \350\352\361\364\371\1\x93\110            AVX512,T1S
-zmmreg_m,zmem64                           \350\351\352\361\371\1\x93\110            AVX512,T1S
+xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x93\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem64                           \350\352\361\371\1\x93\110                AVX512,T1S,DISTINCT,DALL
+ymmreg,ymem64,ymmreg                      \361\362\363\364\371\1\x93\76\110         AVX2,DISTINCT,DALL
+ymmreg_m,ymem64                           \350\352\361\364\371\1\x93\110            AVX512,T1S,DISTINCT,DALL
+zmmreg_m,zmem64                           \350\351\352\361\371\1\x93\110            AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VGATHERQPS]
 [VGATHERQPS]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem32,xmmreg                      \361\362\371\1\x93\76\110                 AVX2
-xmmreg,ymem32,xmmreg                      \361\362\364\371\1\x93\76\110             AVX2
-xmmreg_m,xmem32                           \350\361\371\1\x93\110                    AVX512,T1S
-xmmreg_m,ymem32                           \350\361\364\371\1\x93\110                AVX512,T1S
-ymmreg_m,zmem32                           \350\351\361\371\1\x93\110                AVX512,T1S
+xmmreg,xmem32,xmmreg                      \361\362\371\1\x93\76\110                 AVX2,DISTINCT,DALL
+xmmreg,ymem32,xmmreg                      \361\362\364\371\1\x93\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem32                           \350\361\371\1\x93\110                    AVX512,T1S,DISTINCT,DALL
+xmmreg_m,ymem32                           \350\361\364\371\1\x93\110                AVX512,T1S,DISTINCT,DALL
+ymmreg_m,zmem32                           \350\351\361\371\1\x93\110                AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VPGATHERDD]
 [VPGATHERDD]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem32,xmmreg                      \361\362\371\1\x90\76\110                 AVX2
-xmmreg_m,xmem32                           \350\361\371\1\x90\110                    AVX512,T1S
-ymmreg,ymem32,ymmreg                      \361\362\364\371\1\x90\76\110             AVX2
-ymmreg_m,ymem32                           \350\361\364\371\1\x90\110                AVX512,T1S
-zmmreg_m,zmem32                           \350\351\361\371\1\x90\110                AVX512,T1S
+xmmreg,xmem32,xmmreg                      \361\362\371\1\x90\76\110                 AVX2,DISTINCT,DALL
+xmmreg_m,xmem32                           \350\361\371\1\x90\110                    AVX512,T1S,DISTINCT,DALL
+ymmreg,ymem32,ymmreg                      \361\362\364\371\1\x90\76\110             AVX2,DISTINCT,DALL
+ymmreg_m,ymem32                           \350\361\364\371\1\x90\110                AVX512,T1S,DISTINCT,DALL
+zmmreg_m,zmem32                           \350\351\361\371\1\x90\110                AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VPGATHERDQ]
 [VPGATHERDQ]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x90\76\110             AVX2
-xmmreg_m,xmem64                           \350\352\361\371\1\x90\110                AVX512,T1S
-ymmreg,xmem64,ymmreg                      \361\362\363\364\371\1\x90\76\110         AVX2
-ymmreg_m,xmem64                           \350\352\361\364\371\1\x90\110            AVX512,T1S
-zmmreg_m,ymem64                           \350\351\352\361\371\1\x90\110            AVX512,T1S
+xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x90\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem64                           \350\352\361\371\1\x90\110                AVX512,T1S,DISTINCT,DALL
+ymmreg,xmem64,ymmreg                      \361\362\363\364\371\1\x90\76\110         AVX2,DISTINCT,DALL
+ymmreg_m,xmem64                           \350\352\361\364\371\1\x90\110            AVX512,T1S,DISTINCT,DALL
+zmmreg_m,ymem64                           \350\351\352\361\371\1\x90\110            AVX512,T1S,DISTINCT,DALL
 
 
 [VPGATHERQD]
 [VPGATHERQD]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem32,xmmreg                      \361\362\371\1\x91\76\110                 AVX2
-xmmreg,ymem32,xmmreg                      \361\362\364\371\1\x91\76\110             AVX2
-xmmreg_m,xmem32                           \350\361\371\1\x91\110                    AVX512,T1S
-xmmreg_m,ymem32                           \350\361\364\371\1\x91\110                AVX512,T1S
-ymmreg_m,zmem32                           \350\351\361\371\1\x91\110                AVX512,T1S
+xmmreg,xmem32,xmmreg                      \361\362\371\1\x91\76\110                 AVX2,DISTINCT,DALL
+xmmreg,ymem32,xmmreg                      \361\362\364\371\1\x91\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem32                           \350\361\371\1\x91\110                    AVX512,T1S,DISTINCT,DALL
+xmmreg_m,ymem32                           \350\361\364\371\1\x91\110                AVX512,T1S,DISTINCT,DALL
+ymmreg_m,zmem32                           \350\351\361\371\1\x91\110                AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VPGATHERQQ]
 [VPGATHERQQ]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
-xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x91\76\110             AVX2
-xmmreg_m,xmem64                           \350\352\361\371\1\x91\110                AVX512,T1S
-ymmreg,ymem64,ymmreg                      \361\362\363\364\371\1\x91\76\110         AVX2
-ymmreg_m,ymem64                           \350\352\361\364\371\1\x91\110            AVX512,T1S
-zmmreg_m,zmem64                           \350\351\352\361\371\1\x91\110            AVX512,T1S
+xmmreg,xmem64,xmmreg                      \361\362\363\371\1\x91\76\110             AVX2,DISTINCT,DALL
+xmmreg_m,xmem64                           \350\352\361\371\1\x91\110                AVX512,T1S,DISTINCT,DALL
+ymmreg,ymem64,ymmreg                      \361\362\363\364\371\1\x91\76\110         AVX2,DISTINCT,DALL
+ymmreg_m,ymem64                           \350\352\361\364\371\1\x91\110            AVX512,T1S,DISTINCT,DALL
+zmmreg_m,zmem64                           \350\351\352\361\371\1\x91\110            AVX512,T1S,DISTINCT,DALL
 
 
 
 
 ;*******************************************************************************
 ;*******************************************************************************
@@ -7831,7 +7831,7 @@ mem                   \2\x0F\xAE\204                                      XSAVE
 
 
 [XSAVE64]
 [XSAVE64]
 (Ch_All)
 (Ch_All)
-mem                   \326\2\x0F\xAE\204                                  XSAVE
+mem                   \326\2\x0F\xAE\204                                  XSAVE,X86_64
 
 
 [XRSTOR]
 [XRSTOR]
 (Ch_All)
 (Ch_All)
@@ -7839,7 +7839,7 @@ mem                   \2\x0F\xAE\205                                      XSAVE
 
 
 [XRSTOR64]
 [XRSTOR64]
 (Ch_All)
 (Ch_All)
-mem                   \326\2\x0F\xAE\205                                  XSAVE
+mem                   \326\2\x0F\xAE\205                                  XSAVE,X86_64
 
 
 [XSAVEOPT]
 [XSAVEOPT]
 (Ch_All)
 (Ch_All)
@@ -7847,7 +7847,7 @@ mem                   \2\x0F\xAE\206                                      XSAVE
 
 
 [XSAVEOPT64]
 [XSAVEOPT64]
 (Ch_All)
 (Ch_All)
-mem                   \326\2\x0F\xAE\206                                  XSAVE
+mem                   \326\2\x0F\xAE\206                                  XSAVE,X86_64
 
 
 
 
 ;*******************************************************************************
 ;*******************************************************************************
@@ -8417,10 +8417,10 @@ ymmreg_mz,bmem64                          \334\350\351\352\370\1\x7A\110
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 [VCVTUSI2SD,vcvtusi2sdS]
 [VCVTUSI2SD,vcvtusi2sdS]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
-xmmreg,xmmreg_er,reg32                    \334\350\370\1\x7B\75\120                 AVX512
+xmmreg,xmmreg,reg32                       \334\350\370\1\x7B\75\120                 AVX512
 xmmreg,xmmreg_er,reg64                    \334\350\352\370\1\x7B\75\120             AVX512,X86_64
 xmmreg,xmmreg_er,reg64                    \334\350\352\370\1\x7B\75\120             AVX512,X86_64
-xmmreg,xmmreg_er,mem32                    \334\350\370\1\x7B\75\120                 AVX512,T1S
-xmmreg,xmmreg_er,mem64                    \334\350\352\370\1\x7B\75\120             AVX512,T1S
+xmmreg,xmmreg,mem32                       \334\350\370\1\x7B\75\120                 AVX512,T1S
+xmmreg,xmmreg,mem64                       \334\350\352\370\1\x7B\75\120             AVX512,T1S
 
 
 
 
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
 ; special handling - gas suffix "S" =>> instructions-opsize = source-operand
@@ -8428,8 +8428,8 @@ xmmreg,xmmreg_er,mem64                    \334\350\352\370\1\x7B\75\120
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
 xmmreg,xmmreg_er,reg32                    \333\350\370\1\x7B\75\120                 AVX512
 xmmreg,xmmreg_er,reg32                    \333\350\370\1\x7B\75\120                 AVX512
 xmmreg,xmmreg_er,reg64                    \333\350\352\370\1\x7B\75\120             AVX512,X86_64
 xmmreg,xmmreg_er,reg64                    \333\350\352\370\1\x7B\75\120             AVX512,X86_64
-xmmreg,xmmreg_er,mem32                    \333\350\370\1\x7B\75\120                 AVX512,T1S
-xmmreg,xmmreg_er,mem64                    \333\350\352\370\1\x7B\75\120             AVX512,T1S
+xmmreg,xmmreg,mem32                       \333\350\370\1\x7B\75\120                 AVX512,T1S
+xmmreg,xmmreg,mem64                       \333\350\352\370\1\x7B\75\120             AVX512,T1S
 
 
 [VDBPSADBW]
 [VDBPSADBW]
 (Ch_Wop4, Ch_Rop3, Ch_Rop2)
 (Ch_Wop4, Ch_Rop3, Ch_Rop2)
@@ -8681,57 +8681,75 @@ zmmreg_mz,zmmreg,ymmrm,imm8               \350\351\352\361\372\1\x3A\75\120\27
 
 
 [VMOVDQA32]
 [VMOVDQA32]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \350\351\361\370\1\x7F\101                AVX512,TFVM
+mem256_m,ymmreg                           \350\361\364\370\1\x7F\101                AVX512,TFVM
 xmmreg_mz,xmmrm                           \350\361\370\1\x6F\110                    AVX512,TFVM
 xmmreg_mz,xmmrm                           \350\361\370\1\x6F\110                    AVX512,TFVM
-xmmrm_mz,xmmreg                           \350\361\370\1\x7F\101                    AVX512,TFVM
+xmmreg_mz,xmmreg                          \350\361\370\1\x7F\101                    AVX512,TFVM
+mem128_m,xmmreg                           \350\361\370\1\x7F\101                    AVX512,TFVM
 ymmreg_mz,ymmrm                           \350\361\364\370\1\x6F\110                AVX512,TFVM
 ymmreg_mz,ymmrm                           \350\361\364\370\1\x6F\110                AVX512,TFVM
-ymmrm_mz,ymmreg                           \350\361\364\370\1\x7F\101                AVX512,TFVM
+ymmreg_mz,ymmreg                          \350\361\364\370\1\x7F\101                AVX512,TFVM
 zmmreg_mz,zmmrm                           \350\351\361\370\1\x6F\110                AVX512,TFVM
 zmmreg_mz,zmmrm                           \350\351\361\370\1\x6F\110                AVX512,TFVM
-zmmrm_mz,zmmreg                           \350\351\361\370\1\x7F\101                AVX512,TFVM
+zmmreg_mz,zmmreg                          \350\351\361\370\1\x7F\101                AVX512,TFVM
 
 
 [VMOVDQA64]
 [VMOVDQA64]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \350\351\352\361\370\1\x7F\101            AVX512,TFVM
+mem256_m,ymmreg                           \350\352\361\364\370\1\x7F\101            AVX512,TFVM
 xmmreg_mz,xmmrm                           \350\352\361\370\1\x6F\110                AVX512,TFVM
 xmmreg_mz,xmmrm                           \350\352\361\370\1\x6F\110                AVX512,TFVM
-xmmrm_mz,xmmreg                           \350\352\361\370\1\x7F\101                AVX512,TFVM
+xmmreg_mz,xmmreg                          \350\352\361\370\1\x7F\101                AVX512,TFVM
+mem128_m,xmmreg                           \350\352\361\370\1\x7F\101                AVX512,TFVM
 ymmreg_mz,ymmrm                           \350\352\361\364\370\1\x6F\110            AVX512,TFVM
 ymmreg_mz,ymmrm                           \350\352\361\364\370\1\x6F\110            AVX512,TFVM
-ymmrm_mz,ymmreg                           \350\352\361\364\370\1\x7F\101            AVX512,TFVM
+ymmreg_mz,ymmreg                          \350\352\361\364\370\1\x7F\101            AVX512,TFVM
 zmmreg_mz,zmmrm                           \350\351\352\361\370\1\x6F\110            AVX512,TFVM
 zmmreg_mz,zmmrm                           \350\351\352\361\370\1\x6F\110            AVX512,TFVM
-zmmrm_mz,zmmreg                           \350\351\352\361\370\1\x7F\101            AVX512,TFVM
+zmmreg_mz,zmmreg                          \350\351\352\361\370\1\x7F\101            AVX512,TFVM
 
 
 [VMOVDQU16]
 [VMOVDQU16]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \334\350\351\352\370\1\x7F\101            AVX512,TFVM
+mem256_m,ymmreg                           \334\350\352\364\370\1\x7F\101            AVX512,TFVM
 xmmreg_mz,xmmrm                           \334\350\352\370\1\x6F\110                AVX512,TFVM
 xmmreg_mz,xmmrm                           \334\350\352\370\1\x6F\110                AVX512,TFVM
-xmmrm_mz,xmmreg                           \334\350\352\370\1\x7F\101                AVX512,TFVM
+xmmreg_mz,xmmreg                          \334\350\352\370\1\x7F\101                AVX512,TFVM
+mem128_m,xmmreg                           \334\350\352\370\1\x7F\101                AVX512,TFVM
 ymmreg_mz,ymmrm                           \334\350\352\364\370\1\x6F\110            AVX512,TFVM
 ymmreg_mz,ymmrm                           \334\350\352\364\370\1\x6F\110            AVX512,TFVM
-ymmrm_mz,ymmreg                           \334\350\352\364\370\1\x7F\101            AVX512,TFVM
+ymmreg_mz,ymmreg                          \334\350\352\364\370\1\x7F\101            AVX512,TFVM
 zmmreg_mz,zmmrm                           \334\350\351\352\370\1\x6F\110            AVX512,TFVM
 zmmreg_mz,zmmrm                           \334\350\351\352\370\1\x6F\110            AVX512,TFVM
-zmmrm_mz,zmmreg                           \334\350\351\352\370\1\x7F\101            AVX512,TFVM
+zmmreg_mz,zmmreg                          \334\350\351\352\370\1\x7F\101            AVX512,TFVM
 
 
 [VMOVDQU32]
 [VMOVDQU32]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \333\350\351\370\1\x7F\101                AVX512,TFVM
+mem256_m,ymmreg                           \333\350\364\370\1\x7F\101                AVX512,TFVM
 xmmreg_mz,xmmrm                           \333\350\370\1\x6F\110                    AVX512,TFVM
 xmmreg_mz,xmmrm                           \333\350\370\1\x6F\110                    AVX512,TFVM
-xmmrm_mz,xmmreg                           \333\350\370\1\x7F\101                    AVX512,TFVM
+xmmreg_mz,xmmreg                          \333\350\370\1\x7F\101                    AVX512,TFVM
+mem128_m,xmmreg                           \333\350\370\1\x7F\101                    AVX512,TFVM
 ymmreg_mz,ymmrm                           \333\350\364\370\1\x6F\110                AVX512,TFVM
 ymmreg_mz,ymmrm                           \333\350\364\370\1\x6F\110                AVX512,TFVM
-ymmrm_mz,ymmreg                           \333\350\364\370\1\x7F\101                AVX512,TFVM
+ymmreg_mz,ymmreg                          \333\350\364\370\1\x7F\101                AVX512,TFVM
 zmmreg_mz,zmmrm                           \333\350\351\370\1\x6F\110                AVX512,TFVM
 zmmreg_mz,zmmrm                           \333\350\351\370\1\x6F\110                AVX512,TFVM
-zmmrm_mz,zmmreg                           \333\350\351\370\1\x7F\101                AVX512,TFVM
+zmmreg_mz,zmmreg                          \333\350\351\370\1\x7F\101                AVX512,TFVM
 
 
 [VMOVDQU64]
 [VMOVDQU64]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \333\350\351\352\370\1\x7F\101            AVX512,TFVM
+mem256_m,ymmreg                           \333\350\352\364\370\1\x7F\101            AVX512,TFVM
 xmmreg_mz,xmmrm                           \333\350\352\370\1\x6F\110                AVX512,TFVM
 xmmreg_mz,xmmrm                           \333\350\352\370\1\x6F\110                AVX512,TFVM
-xmmrm_mz,xmmreg                           \333\350\352\370\1\x7F\101                AVX512,TFVM
+xmmreg_mz,xmmreg                          \333\350\352\370\1\x7F\101                AVX512,TFVM
+mem128_m,xmmreg                           \333\350\352\370\1\x7F\101                AVX512,TFVM
 ymmreg_mz,ymmrm                           \333\350\352\364\370\1\x6F\110            AVX512,TFVM
 ymmreg_mz,ymmrm                           \333\350\352\364\370\1\x6F\110            AVX512,TFVM
-ymmrm_mz,ymmreg                           \333\350\352\364\370\1\x7F\101            AVX512,TFVM
+ymmreg_mz,ymmreg                          \333\350\352\364\370\1\x7F\101            AVX512,TFVM
 zmmreg_mz,zmmrm                           \333\350\351\352\370\1\x6F\110            AVX512,TFVM
 zmmreg_mz,zmmrm                           \333\350\351\352\370\1\x6F\110            AVX512,TFVM
-zmmrm_mz,zmmreg                           \333\350\351\352\370\1\x7F\101            AVX512,TFVM
+zmmreg_mz,zmmreg                          \333\350\351\352\370\1\x7F\101            AVX512,TFVM
 
 
 [VMOVDQU8]
 [VMOVDQU8]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
+mem512_m,zmmreg                           \334\350\351\370\1\x7F\101                AVX512,TFVM
+mem256_m,ymmreg                           \334\350\364\370\1\x7F\101                AVX512,TFVM
 xmmreg_mz,xmmrm                           \334\350\370\1\x6F\110                    AVX512,TFVM
 xmmreg_mz,xmmrm                           \334\350\370\1\x6F\110                    AVX512,TFVM
-xmmrm_mz,xmmreg                           \334\350\370\1\x7F\101                    AVX512,TFVM
+xmmreg_mz,xmmreg                          \334\350\370\1\x7F\101                    AVX512,TFVM
+mem128_m,xmmreg                           \334\350\370\1\x7F\101                    AVX512,TFVM
 ymmreg_mz,ymmrm                           \334\350\364\370\1\x6F\110                AVX512,TFVM
 ymmreg_mz,ymmrm                           \334\350\364\370\1\x6F\110                AVX512,TFVM
-ymmrm_mz,ymmreg                           \334\350\364\370\1\x7F\101                AVX512,TFVM
+ymmreg_mz,ymmreg                          \334\350\364\370\1\x7F\101                AVX512,TFVM
 zmmreg_mz,zmmrm                           \334\350\351\370\1\x6F\110                AVX512,TFVM
 zmmreg_mz,zmmrm                           \334\350\351\370\1\x6F\110                AVX512,TFVM
-zmmrm_mz,zmmreg                           \334\350\351\370\1\x7F\101                AVX512,TFVM
+zmmreg_mz,zmmreg                          \334\350\351\370\1\x7F\101                AVX512,TFVM
 
 
 [VPABSQ]
 [VPABSQ]
 (Ch_Wop2, Ch_Rop1)
 (Ch_Wop2, Ch_Rop1)
@@ -9760,27 +9778,27 @@ zmmreg_mz,zmmreg,bmem64                   \350\351\352\361\371\1\x14\75\120
 
 
 [VPSCATTERDD]
 [VPSCATTERDD]
 (Ch_Mop2, Ch_Rop1)
 (Ch_Mop2, Ch_Rop1)
-xmem32_m,xmmreg                           \350\361\371\1\xA0\101                    AVX512,T1S
-ymem32_m,ymmreg                           \350\361\364\371\1\xA0\101                AVX512,T1S
-zmem32_m,zmmreg                           \350\351\361\371\1\xA0\101                AVX512,T1S
+xmem32_m,xmmreg                           \350\361\371\1\xA0\101                    AVX512,T1S,DISTINCT,DALL
+ymem32_m,ymmreg                           \350\361\364\371\1\xA0\101                AVX512,T1S,DISTINCT,DALL
+zmem32_m,zmmreg                           \350\351\361\371\1\xA0\101                AVX512,T1S,DISTINCT,DALL
 
 
 [VPSCATTERDQ]
 [VPSCATTERDQ]
 (Ch_Mop2, Ch_Rop1)
 (Ch_Mop2, Ch_Rop1)
-xmem64_m,xmmreg                           \350\352\361\371\1\xA0\101                AVX512,T1S
-xmem64_m,ymmreg                           \350\352\361\364\371\1\xA0\101            AVX512,T1S
-ymem64_m,zmmreg                           \350\351\352\361\371\1\xA0\101            AVX512,T1S
+xmem64_m,xmmreg                           \350\352\361\371\1\xA0\101                AVX512,T1S,DISTINCT,DALL
+xmem64_m,ymmreg                           \350\352\361\364\371\1\xA0\101            AVX512,T1S,DISTINCT,DALL
+ymem64_m,zmmreg                           \350\351\352\361\371\1\xA0\101            AVX512,T1S,DISTINCT,DALL
 
 
 [VPSCATTERQD]
 [VPSCATTERQD]
 (Ch_Mop2, Ch_Rop1)
 (Ch_Mop2, Ch_Rop1)
-xmem32_m,xmmreg                           \350\361\371\1\xA1\101                    AVX512,T1S
-ymem32_m,xmmreg                           \350\361\364\371\1\xA1\101                AVX512,T1S
-zmem32_m,ymmreg                           \350\351\361\371\1\xA1\101                AVX512,T1S
+xmem32_m,xmmreg                           \350\361\371\1\xA1\101                    AVX512,T1S,DISTINCT,DALL
+ymem32_m,xmmreg                           \350\361\364\371\1\xA1\101                AVX512,T1S,DISTINCT,DALL
+zmem32_m,ymmreg                           \350\351\361\371\1\xA1\101                AVX512,T1S,DISTINCT,DALL
 
 
 [VPSCATTERQQ]
 [VPSCATTERQQ]
 (Ch_Mop2, Ch_Rop1)
 (Ch_Mop2, Ch_Rop1)
-xmem64_m,xmmreg                           \350\352\361\371\1\xA1\101                AVX512,T1S
-ymem64_m,ymmreg                           \350\352\361\364\371\1\xA1\101            AVX512,T1S
-zmem64_m,zmmreg                           \350\351\352\361\371\1\xA1\101            AVX512,T1S
+xmem64_m,xmmreg                           \350\352\361\371\1\xA1\101                AVX512,T1S,DISTINCT,DALL
+ymem64_m,ymmreg                           \350\352\361\364\371\1\xA1\101            AVX512,T1S,DISTINCT,DALL
+zmem64_m,zmmreg                           \350\351\352\361\371\1\xA1\101            AVX512,T1S,DISTINCT,DALL
 
 
 [VPSLLVW]
 [VPSLLVW]
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
 (Ch_Wop3, Ch_Rop2, Ch_Rop1)
@@ -10139,28 +10157,28 @@ xmmreg_mz,xmmreg,xmmreg_er                \350\361\371\1\x2D\75\120
 
 
 [VSCATTERDPD]
 [VSCATTERDPD]
 (Ch_All)
 (Ch_All)
-xmem64_m,xmmreg                           \350\352\361\371\1\xA2\101                AVX512,T1S
-xmem64_m,ymmreg                           \350\352\361\364\371\1\xA2\101            AVX512,T1S
-ymem64_m,zmmreg                           \350\351\352\361\371\1\xA2\101            AVX512,T1S
+xmem64_m,xmmreg                           \350\352\361\371\1\xA2\101                AVX512,T1S,DISTINCT,DALL
+xmem64_m,ymmreg                           \350\352\361\364\371\1\xA2\101            AVX512,T1S,DISTINCT,DALL
+ymem64_m,zmmreg                           \350\351\352\361\371\1\xA2\101            AVX512,T1S,DISTINCT,DALL
 
 
 [VSCATTERDPS]
 [VSCATTERDPS]
 (Ch_All)
 (Ch_All)
-xmem32_m,xmmreg                           \350\361\371\1\xA2\101                    AVX512,T1S
-ymem32_m,ymmreg                           \350\361\364\371\1\xA2\101                AVX512,T1S
-zmem32_m,zmmreg                           \350\351\361\371\1\xA2\101                AVX512,T1S
+xmem32_m,xmmreg                           \350\361\371\1\xA2\101                    AVX512,T1S,DISTINCT,DALL
+ymem32_m,ymmreg                           \350\361\364\371\1\xA2\101                AVX512,T1S,DISTINCT,DALL
+zmem32_m,zmmreg                           \350\351\361\371\1\xA2\101                AVX512,T1S,DISTINCT,DALL
 
 
 
 
 [VSCATTERQPD]
 [VSCATTERQPD]
 (Ch_All)
 (Ch_All)
-xmem64_m,xmmreg                           \350\352\361\371\1\xA3\101                AVX512,T1S
-ymem64_m,ymmreg                           \350\352\361\364\371\1\xA3\101            AVX512,T1S
-zmem64_m,zmmreg                           \350\351\352\361\371\1\xA3\101            AVX512,T1S
+xmem64_m,xmmreg                           \350\352\361\371\1\xA3\101                AVX512,T1S,DISTINCT,DALL
+ymem64_m,ymmreg                           \350\352\361\364\371\1\xA3\101            AVX512,T1S,DISTINCT,DALL
+zmem64_m,zmmreg                           \350\351\352\361\371\1\xA3\101            AVX512,T1S,DISTINCT,DALL
 
 
 [VSCATTERQPS]
 [VSCATTERQPS]
 (Ch_All)
 (Ch_All)
-xmem32_m,xmmreg                           \350\361\371\1\xA3\101                    AVX512,T1S
-ymem32_m,xmmreg                           \350\361\364\371\1\xA3\101                AVX512,T1S
-zmem32_m,ymmreg                           \350\351\361\371\1\xA3\101                AVX512,T1S
+xmem32_m,xmmreg                           \350\361\371\1\xA3\101                    AVX512,T1S,DISTINCT,DALL
+ymem32_m,xmmreg                           \350\361\364\371\1\xA3\101                AVX512,T1S,DISTINCT,DALL
+zmem32_m,ymmreg                           \350\351\361\371\1\xA3\101                AVX512,T1S,DISTINCT,DALL
 
 
 [VSHUFF32X4]
 [VSHUFF32X4]
 (Ch_All)
 (Ch_All)
@@ -10503,13 +10521,92 @@ xmmreg,xmmrm,imm                          \361\3\x0F\x3A\xCE\110\26
 (Ch_Mop2, Ch_Rop1)
 (Ch_Mop2, Ch_Rop1)
 xmmreg,xmmrm                              \361\3\x0F\x38\xCF\110                 GFNI
 xmmreg,xmmrm                              \361\3\x0F\x38\xCF\110                 GFNI
 
 
+;*******************************************************************************
+;********* BF16 ****************************************************************
+;*******************************************************************************
+
+[VCVTNE2PS2BF16]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm                    \350\334\371\1\x72\75\120          AVX512,TFV
+xmmreg_mz,xmmreg,bmem32                   \350\334\371\1\x72\75\120          AVX512,TFV;,BCST8
+ymmreg_mz,ymmreg,ymmrm                    \350\364\334\371\1\x72\75\120      AVX512,TFV
+ymmreg_mz,ymmreg,bmem32                   \350\364\334\371\1\x72\75\120      AVX512,TFV;,BCST16
+zmmreg_mz,zmmreg,zmmrm                    \350\351\334\371\1\x72\75\120      AVX512,TFV
+zmmreg_mz,zmmreg,bmem32                   \350\351\334\371\1\x72\75\120      AVX512,TFV;,BCST32
+
+[VCVTNEPS2BF16,vcvtneps2bf16N]
+(Ch_Wop2, Ch_Rop1)
+ymmreg_mz,mem512                          \350\351\333\371\1\x72\110         AVX512,TFV
+xmmreg_mz,mem256                          \350\364\333\371\1\x72\110         AVX512,TFV
+xmmreg_mz,mem128                          \350\333\371\1\x72\110             AVX512,TFV
+xmmreg_mz,xmmreg                          \350\333\371\1\x72\110             AVX512,TFV
+xmmreg_mz,bmem32                          \350\333\371\1\x72\110             AVX512,T1F32,BCST4
+xmmreg_mz,ymmreg                          \350\364\333\371\1\x72\110         AVX512,TFV
+xmmreg_mz,bmem32                          \350\364\333\371\1\x72\110         AVX512,T1F32,BCST8
+ymmreg_mz,zmmreg                          \350\351\333\371\1\x72\110         AVX512,TFV
+ymmreg_mz,bmem32                          \350\351\333\371\1\x72\110         AVX512,T1F32,BCST16
+
+[VDPBF16PS]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm                    \350\333\371\1\x52\75\120          AVX512,TFV
+xmmreg_mz,xmmreg,bmem32                   \350\333\371\1\x52\75\120          AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm                    \350\364\333\371\1\x52\75\120      AVX512,TFV
+ymmreg_mz,ymmreg,bmem32                   \350\364\333\371\1\x52\75\120      AVX512,TFV
+zmmreg_mz,zmmreg,zmmrm                    \350\351\333\371\1\x52\75\120      AVX512,TFV
+zmmreg_mz,zmmreg,bmem32                   \350\351\333\371\1\x52\75\120      AVX512,TFV
+
+;*******************************************************************************
+;********* 4FMAPS **************************************************************
+;*******************************************************************************
+
+[V4FMADDPS]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+zmmreg_mz,zmmreg,memory                   \350\351\334\371\1\x9A\75\120      AVX512,TQVM
+
+[V4FMADDSS]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+xmmreg_mz,xmmreg,mem128                   \350\334\371\1\x9B\75\120          AVX512,TFV
+
+[V4FNMADDPS]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+zmmreg_mz,zmmreg,memory                   \350\351\334\371\1\xAA\75\120      AVX512,TQVM
+
+[V4FNMADDSS]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+xmmreg_mz,xmmreg,mem128                   \350\334\371\1\xAB\75\120          AVX512,TFV
+
+;*******************************************************************************
+;********* 4VNNIW **************************************************************
+;*******************************************************************************
+
+[VP4DPWSSD]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+zmmreg_mz,zmmreg,memory                   \350\351\334\371\1\x52\75\120      AVX512,TQVM
+
+[VP4DPWSSDS]
+; operand 2 read group of 4 registers
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
+zmmreg_mz,zmmreg,memory                   \350\351\334\371\1\x53\75\120      AVX512,TQVM
+
 ;*******************************************************************************
 ;*******************************************************************************
 ;********* VP2INTERSECT ********************************************************
 ;********* VP2INTERSECT ********************************************************
 ;*******************************************************************************
 ;*******************************************************************************
 
 
 [VP2INTERSECTD]
 [VP2INTERSECTD]
-;-- Write kreg and kreg+1
-(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+;-- Write kreg even-odd pair
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
 kreg,xmmreg,xmmrm            \350\334\371\1\x68\75\120               AVX512,TFV
 kreg,xmmreg,xmmrm            \350\334\371\1\x68\75\120               AVX512,TFV
 kreg,xmmreg,bmem32           \350\334\371\1\x68\75\120               AVX512,TFV
 kreg,xmmreg,bmem32           \350\334\371\1\x68\75\120               AVX512,TFV
 kreg,ymmreg,ymmrm            \350\334\364\371\1\x68\75\120           AVX512,TFV
 kreg,ymmreg,ymmrm            \350\334\364\371\1\x68\75\120           AVX512,TFV
@@ -10518,8 +10615,9 @@ kreg,zmmreg,zmmrm            \350\334\351\371\1\x68\75\120           AVX512,TFV
 kreg,zmmreg,bmem32           \350\334\351\371\1\x68\75\120           AVX512,TFV
 kreg,zmmreg,bmem32           \350\334\351\371\1\x68\75\120           AVX512,TFV
 
 
 [VP2INTERSECTQ]
 [VP2INTERSECTQ]
-;-- Write kreg and kreg+1
-(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+;-- Write kreg even-odd pair
+;(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+(Ch_All)
 kreg,xmmreg,xmmrm            \350\352\334\371\1\x68\75\120           AVX512,TFV
 kreg,xmmreg,xmmrm            \350\352\334\371\1\x68\75\120           AVX512,TFV
 kreg,xmmreg,bmem64           \350\352\334\371\1\x68\75\120           AVX512,TFV
 kreg,xmmreg,bmem64           \350\352\334\371\1\x68\75\120           AVX512,TFV
 kreg,ymmreg,ymmrm            \350\352\334\364\371\1\x68\75\120       AVX512,TFV
 kreg,ymmreg,ymmrm            \350\352\334\364\371\1\x68\75\120       AVX512,TFV
@@ -10527,3 +10625,1364 @@ kreg,ymmreg,bmem64           \350\352\334\364\371\1\x68\75\120       AVX512,TFV
 kreg,zmmreg,zmmrm            \350\352\334\351\371\1\x68\75\120       AVX512,TFV
 kreg,zmmreg,zmmrm            \350\352\334\351\371\1\x68\75\120       AVX512,TFV
 kreg,zmmreg,bmem64           \350\352\334\351\371\1\x68\75\120       AVX512,TFV
 kreg,zmmreg,bmem64           \350\352\334\351\371\1\x68\75\120       AVX512,TFV
 
 
+;*******************************************************************************
+;********* FP16 ****************************************************************
+;*******************************************************************************
+
+[VMOVW]
+(Ch_Wop2, Ch_Rop1)
+xmmreg,rm16                    \350\361\375\1\x6E\110          AVX512,T1S
+xmmreg,reg32                   \350\361\375\1\x6E\110          AVX512     ; Gas exepect reg32, while documentation say reg16. Provided for Gas compatibility.
+rm16,xmmreg                    \350\361\375\1\x7E\101          AVX512,T1S
+reg32,xmmreg                   \350\361\375\1\x7E\101          AVX512     ; Gas exepect reg32, while documentation say reg16. Provided for Gas compatibility.
+
+[VMOVSH]
+(Ch_All)
+xmmreg_mz,mem16                \350\333\375\1\x10\110          AVX512,T1S
+xmmreg_mz,xmmreg,xmmreg        \350\333\375\1\x10\75\120       AVX512
+mem16_m,xmmreg                 \350\333\375\1\x11\101          AVX512,T1S
+xmmreg_mz,xmmreg,xmmreg        \350\333\375\1\x11\75\102       AVX512
+
+[VADDPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\375\1\x58\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\375\1\x58\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\364\375\1\x58\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\364\375\1\x58\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\351\375\1\x58\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\351\375\1\x58\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\351\375\1\x58\75\120       AVX512,TFV
+
+[VADDSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\333\375\1\x58\75\120       AVX512
+xmmreg_mz,xmmreg,mem16         \350\333\375\1\x58\75\120       AVX512,T1S
+
+; Psoudo ops for VCMPPH and VCMPSH. Gas provide them, so do we.
+[VCMPEQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x00        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x00        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x00    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x00    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x00    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x00    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x00    AVX512,TFV
+
+[VCMPLTPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x01        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x01        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x01    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x01    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x01    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x01    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x01    AVX512,TFV
+
+[VCMPLEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x02        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x02        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x02    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x02    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x02    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x02    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x02    AVX512,TFV
+
+[VCMPUNORDPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x03        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x03        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x03    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x03    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x03    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x03    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x03    AVX512,TFV
+
+[VCMPNEQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x04        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x04        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x04    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x04    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x04    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x04    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x04    AVX512,TFV
+
+[VCMPNLTPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x05        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x05        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x05    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x05    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x05    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x05    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x05    AVX512,TFV
+
+[VCMPNLEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x06        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x06        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x06    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x06    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x06    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x06    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x06    AVX512,TFV
+
+[VCMPORDPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x07        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x07        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x07    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x07    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x07    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x07    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x07    AVX512,TFV
+
+[VCMPEQ_UQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x08        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x08        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x08    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x08    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x08    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x08    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x08    AVX512,TFV
+
+[VCMPNGEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x09        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x09        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x09    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x09    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x09    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x09    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x09    AVX512,TFV
+
+[VCMPNGTPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0A        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0A        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0A    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0A    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0A    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0A    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0A    AVX512,TFV
+
+[VCMPFALSEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0B        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0B        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0B    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0B    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0B    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0B    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0B    AVX512,TFV
+
+[VCMPNEQ_OQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0C        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0C        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0C    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0C    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0C    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0C    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0C    AVX512,TFV
+
+[VCMPGEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0D        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0D        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0D    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0D    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0D    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0D    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0D    AVX512,TFV
+
+[VCMPGTPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0E        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0E        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0E    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0E    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0E    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0E    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0E    AVX512,TFV
+
+[VCMPTRUEPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x0F        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x0F        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x0F    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x0F    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x0F    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x0F    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x0F    AVX512,TFV
+
+[VCMPEQ_OSPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x10        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x10        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x10    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x10    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x10    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x10    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x10    AVX512,TFV
+
+[VCMPLT_OQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x11        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x11        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x11    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x11    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x11    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x11    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x11    AVX512,TFV
+
+[VCMPLE_OQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x12        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x12        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x12    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x12    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x12    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x12    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x12    AVX512,TFV
+
+[VCMPUNORD_SPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x13        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x13        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x13    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x13    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x13    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x13    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x13    AVX512,TFV
+
+[VCMPNEQ_USPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x14        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x14        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x14    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x14    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x14    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x14    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x14    AVX512,TFV
+
+[VCMPNLT_UQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x15        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x15        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x15    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x15    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x15    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x15    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x15    AVX512,TFV
+
+[VCMPNLE_UQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x16        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x16        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x16    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x16    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x16    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x16    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x16    AVX512,TFV
+
+[VCMPORD_SPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x17        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x17        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x17    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x17    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x17    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x17    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x17    AVX512,TFV
+
+[VCMPEQ_USPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x18        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x18        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x18    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x18    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x18    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x18    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x18    AVX512,TFV
+
+[VCMPNGE_UQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x19        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x19        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x19    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x19    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x19    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x19    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x19    AVX512,TFV
+
+[VCMPNGT_UQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1A        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1A        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1A    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1A    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1A    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1A    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1A    AVX512,TFV
+
+[VCMPFALSE_OSPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1B        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1B        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1B    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1B    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1B    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1B    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1B    AVX512,TFV
+
+[VCMPNEQ_OSPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1C        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1C        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1C    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1C    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1C    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1C    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1C    AVX512,TFV
+
+[VCMPGE_OQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1D        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1D        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1D    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1D    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1D    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1D    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1D    AVX512,TFV
+
+[VCMPGT_OQPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1E        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1E        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1E    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1E    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1E    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1E    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1E    AVX512,TFV
+
+[VCMPTRUE_USPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm         \350\372\1\xC2\75\120\1\x1F        AVX512,TFV
+kreg_m,xmmreg,bmem16        \350\372\1\xC2\75\120\1\x1F        AVX512,TFV
+kreg_m,ymmreg,ymmrm         \350\364\372\1\xC2\75\120\1\x1F    AVX512,TFV
+kreg_m,ymmreg,bmem16        \350\364\372\1\xC2\75\120\1\x1F    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae    \350\351\372\1\xC2\75\120\1\x1F    AVX512
+kreg_m,zmmreg,mem512        \350\351\372\1\xC2\75\120\1\x1F    AVX512,TFV
+kreg_m,zmmreg,bmem16        \350\351\372\1\xC2\75\120\1\x1F    AVX512,TFV
+
+[VCMPEQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x00    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x00    AVX512,T1S
+
+[VCMPLTSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x01    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x01    AVX512,T1S
+
+[VCMPLESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x02    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x02    AVX512,T1S
+
+[VCMPUNORDSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x03    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x03    AVX512,T1S
+
+[VCMPNEQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x04    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x04    AVX512,T1S
+
+[VCMPNLTSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x05    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x05    AVX512,T1S
+
+[VCMPNLESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x06    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x06    AVX512,T1S
+
+[VCMPORDSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x07    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x07    AVX512,T1S
+
+[VCMPEQ_UQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x08    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x08    AVX512,T1S
+
+[VCMPNGESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x09    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x09    AVX512,T1S
+
+[VCMPNGTSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0A    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0A    AVX512,T1S
+
+[VCMPFALSESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0B    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0B    AVX512,T1S
+
+[VCMPNEQ_OQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0C    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0C    AVX512,T1S
+
+[VCMPGESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0D    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0D    AVX512,T1S
+
+[VCMPGTSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0E    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0E    AVX512,T1S
+
+[VCMPTRUESH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x0F    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x0F    AVX512,T1S
+
+[VCMPEQ_OSSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x10    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x10    AVX512,T1S
+
+[VCMPLT_OQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x11    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x11    AVX512,T1S
+
+[VCMPLE_OQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x12    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x12    AVX512,T1S
+
+[VCMPUNORD_SSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x13    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x13    AVX512,T1S
+
+[VCMPNEQ_USSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x14    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x14    AVX512,T1S
+
+[VCMPNLT_UQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x15    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x15    AVX512,T1S
+
+[VCMPNLE_UQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x16    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x16    AVX512,T1S
+
+[VCMPORD_SSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x17    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x17    AVX512,T1S
+
+[VCMPEQ_USSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x18    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x18    AVX512,T1S
+
+[VCMPNGE_UQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x19    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x19    AVX512,T1S
+
+[VCMPNGT_UQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1A    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1A    AVX512,T1S
+
+[VCMPFALSE_OSSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1B    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1B    AVX512,T1S
+
+[VCMPNEQ_OSSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1C    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1C    AVX512,T1S
+
+[VCMPGE_OQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1D    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1D    AVX512,T1S
+
+[VCMPGT_OQSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1E    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1E    AVX512,T1S
+
+[VCMPTRUE_USSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae    \350\333\372\1\xC2\75\120\1\x1F    AVX512
+kreg_m,xmmreg,mem16         \350\333\372\1\xC2\75\120\1\x1F    AVX512,T1S
+
+; VCMPPH/VCMPSH come after the specific ops.
+[VCMPPH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmrm,imm8       \350\372\1\xC2\75\120\27        AVX512,TFV
+kreg_m,xmmreg,bmem16,imm8      \350\372\1\xC2\75\120\27        AVX512,TFV
+kreg_m,ymmreg,ymmrm,imm8       \350\364\372\1\xC2\75\120\27    AVX512,TFV
+kreg_m,ymmreg,bmem16,imm8      \350\364\372\1\xC2\75\120\27    AVX512,TFV
+kreg_m,zmmreg,zmmreg_sae,imm8  \350\351\372\1\xC2\75\120\27    AVX512
+kreg_m,zmmreg,mem512,imm8      \350\351\372\1\xC2\75\120\27    AVX512,TFV
+kreg_m,zmmreg,bmem16,imm8      \350\351\372\1\xC2\75\120\27    AVX512,TFV
+
+[VCMPSH]
+(Ch_Wop4, Ch_Rop3, Ch_Rop2)
+kreg_m,xmmreg,xmmreg_sae,imm8  \350\333\372\1\xC2\75\120\27    AVX512
+kreg_m,xmmreg,mem16,imm8       \350\333\372\1\xC2\75\120\27    AVX512,T1S
+
+[VCOMISH]
+(Ch_Rop2, Ch_Rop1)
+xmmreg,xmmreg_sae        \350\375\1\x2F\110                  AVX512
+xmmreg,mem16             \350\375\1\x2F\110                  AVX512,T1S
+
+[VCVTDQ2PH,vcvtdq2phN]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,mem256         \350\364\375\1\x5B\110              AVX512,TFV
+xmmreg_mz,xmmrm          \350\375\1\x5B\110                  AVX512,TFV
+xmmreg_mz,bmem32         \350\375\1\x5B\110                  AVX512,T1F32,BCST4
+xmmreg_mz,ymmreg         \350\364\375\1\x5B\110              AVX512,TFV
+xmmreg_mz,bmem32         \350\364\375\1\x5B\110              AVX512,T1F32,BCST8
+ymmreg_mz,zmmreg_er      \350\351\375\1\x5B\110              AVX512
+ymmreg_mz,mem512         \350\351\375\1\x5B\110              AVX512,TFV
+ymmreg_mz,bmem32         \350\351\375\1\x5B\110              AVX512,T1F32,BCST16
+
+[VCVTPD2PH,vcvtpd2phS]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,mem512         \350\352\351\361\375\1\x5A\110      AVX512,TFV
+xmmreg_mz,mem256         \350\352\364\361\375\1\x5A\110      AVX512,TFV
+xmmreg_mz,xmmrm          \350\352\361\375\1\x5A\110          AVX512,TFV
+xmmreg_mz,bmem64         \350\352\361\375\1\x5A\110          AVX512,T1F64,BCST2
+xmmreg_mz,ymmreg         \350\352\364\361\375\1\x5A\110      AVX512,TFV
+xmmreg_mz,bmem64         \350\352\364\361\375\1\x5A\110      AVX512,T1F64,BCST4
+xmmreg_mz,zmmreg_er      \350\352\351\361\375\1\x5A\110      AVX512
+xmmreg_mz,bmem64         \350\352\351\361\375\1\x5A\110      AVX512,T1F64,BCST8
+
+[VCVTPH2DQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem256         \350\351\361\375\1\x5B\110          AVX512,THV
+ymmreg_mz,mem128         \350\364\361\375\1\x5B\110          AVX512,THV
+xmmreg_mz,xmmreg         \350\361\375\1\x5B\110              AVX512,THV
+xmmreg_mz,mem64          \350\361\375\1\x5B\110              AVX512,THV
+xmmreg_mz,bmem16         \350\361\375\1\x5B\110              AVX512,T1S,BCST4
+ymmreg_mz,xmmreg         \350\364\361\375\1\x5B\110          AVX512,THV
+ymmreg_mz,bmem16         \350\364\361\375\1\x5B\110          AVX512,T1S,BCST8
+zmmreg_mz,ymmreg_er      \350\351\361\375\1\x5B\110          AVX512
+zmmreg_mz,bmem16         \350\351\361\375\1\x5B\110          AVX512,T1S,BCST16
+
+[VCVTPH2PD]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem128         \350\351\375\1\x5A\110              AVX512,TQVM
+ymmreg_mz,mem64          \350\364\375\1\x5A\110              AVX512,TQVM
+xmmreg_mz,xmmreg         \350\375\1\x5A\110                  AVX512,TQVM
+xmmreg_mz,mem32          \350\375\1\x5A\110                  AVX512,TQVM
+xmmreg_mz,bmem16         \350\375\1\x5A\110                  AVX512,T1S,BCST2
+ymmreg_mz,xmmreg         \350\364\375\1\x5A\110              AVX512,TQVM
+ymmreg_mz,bmem16         \350\364\375\1\x5A\110              AVX512,T1S,BCST4
+zmmreg_mz,xmmreg_sae     \350\351\375\1\x5A\110              AVX512
+zmmreg_mz,bmem16         \350\351\375\1\x5A\110              AVX512,T1S,BCST8
+
+; - see as well VCVTPH2PS
+[VCVTPH2PSX]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem256         \350\361\351\376\1\x13\110          AVX512,THV
+ymmreg_mz,mem128         \350\361\364\376\1\x13\110          AVX512,THV
+xmmreg_mz,xmmreg         \350\361\376\1\x13\110              AVX512,THV
+xmmreg_mz,mem64          \350\361\376\1\x13\110              AVX512,THV
+xmmreg_mz,bmem16         \350\361\376\1\x13\110              AVX512,T1S,BCST4
+ymmreg_mz,xmmreg         \350\361\364\376\1\x13\110          AVX512,THV
+ymmreg_mz,bmem16         \350\361\364\376\1\x13\110          AVX512,T1S,BCST8
+zmmreg_mz,ymmreg_sae     \350\361\351\376\1\x13\110          AVX512
+zmmreg_mz,bmem16         \350\361\351\376\1\x13\110          AVX512,T1S,BCST16
+
+[VCVTPH2QQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem128         \350\361\351\375\1\x7B\110          AVX512,TQVM
+ymmreg_mz,mem64          \350\361\364\375\1\x7B\110          AVX512,TQVM
+xmmreg_mz,xmmreg         \350\361\375\1\x7B\110              AVX512,TQVM
+xmmreg_mz,mem32          \350\361\375\1\x7B\110              AVX512,TQVM
+xmmreg_mz,bmem16         \350\361\375\1\x7B\110              AVX512,T1S,BCST2
+ymmreg_mz,xmmreg         \350\361\364\375\1\x7B\110          AVX512,TQVM
+ymmreg_mz,bmem16         \350\361\364\375\1\x7B\110          AVX512,T1S,BCST4
+zmmreg_mz,xmmreg_er      \350\361\351\375\1\x7B\110          AVX512
+zmmreg_mz,bmem16         \350\361\351\375\1\x7B\110          AVX512,T1S,BCST8
+
+[VCVTPH2UDQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem256         \350\351\375\1\x79\110              AVX512,THV
+ymmreg_mz,mem128         \350\364\375\1\x79\110              AVX512,THV
+xmmreg_mz,xmmreg         \350\375\1\x79\110                  AVX512,THV
+xmmreg_mz,mem64          \350\375\1\x79\110                  AVX512,THV
+xmmreg_mz,bmem16         \350\375\1\x79\110                  AVX512,T1S,BCST4
+ymmreg_mz,xmmreg         \350\364\375\1\x79\110              AVX512,THV
+ymmreg_mz,bmem16         \350\364\375\1\x79\110              AVX512,T1S,BCST8
+zmmreg_mz,ymmreg_er      \350\351\375\1\x79\110              AVX512
+zmmreg_mz,bmem16         \350\351\375\1\x79\110              AVX512,T1S,BCST16
+
+[VCVTPH2UQQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem128         \350\361\351\375\1\x79\110          AVX512,TQVM
+ymmreg_mz,mem64          \350\361\364\375\1\x79\110          AVX512,TQVM
+xmmreg_mz,xmmreg         \350\361\375\1\x79\110              AVX512,TQVM
+xmmreg_mz,mem32          \350\361\375\1\x79\110              AVX512,TQVM
+xmmreg_mz,bmem16         \350\361\375\1\x79\110              AVX512,T1S,BCST2
+ymmreg_mz,xmmreg         \350\361\364\375\1\x79\110          AVX512,TQVM
+ymmreg_mz,bmem16         \350\361\364\375\1\x79\110          AVX512,T1S,BCST4
+zmmreg_mz,xmmreg_er      \350\361\351\375\1\x79\110          AVX512
+zmmreg_mz,bmem16         \350\361\351\375\1\x79\110          AVX512,T1S,BCST8
+
+[VCVTPH2UW]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\375\1\x7D\110                  AVX512,TFV
+xmmreg_mz,bmem16         \350\375\1\x7D\110                  AVX512,TFV
+ymmreg_mz,ymmrm          \350\364\375\1\x7D\110              AVX512,TFV
+ymmreg_mz,bmem16         \350\364\375\1\x7D\110              AVX512,TFV
+zmmreg_mz,zmmreg_er      \350\351\375\1\x7D\110              AVX512
+zmmreg_mz,mem512         \350\351\375\1\x7D\110              AVX512,TFV
+zmmreg_mz,bmem16         \350\351\375\1\x7D\110              AVX512,TFV
+
+[VCVTPH2W]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\361\375\1\x7D\110              AVX512,TFV
+xmmreg_mz,bmem16         \350\361\375\1\x7D\110              AVX512,TFV
+ymmreg_mz,ymmrm          \350\361\364\375\1\x7D\110          AVX512,TFV
+ymmreg_mz,bmem16         \350\361\364\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,zmmreg_er      \350\361\351\375\1\x7D\110          AVX512
+zmmreg_mz,mem512         \350\361\351\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,bmem16         \350\361\351\375\1\x7D\110          AVX512,TFV
+
+[VCVTPS2PHX,vcvtps2phxN]
+(Ch_Wop2, Ch_Rop1)
+ymmreg_mz,mem512         \350\361\351\375\1\x1D\110          AVX512,TFV
+xmmreg_mz,mem256         \350\361\364\375\1\x1D\110          AVX512,TFV
+xmmreg_mz,xmmrm          \350\361\375\1\x1D\110              AVX512,TFV
+xmmreg_mz,bmem32         \350\361\375\1\x1D\110              AVX512,T1F32,BCST4
+xmmreg_mz,ymmreg         \350\361\364\375\1\x1D\110          AVX512,TFV
+xmmreg_mz,bmem32         \350\361\364\375\1\x1D\110          AVX512,T1F32,BCST8
+ymmreg_mz,zmmreg_er      \350\361\351\375\1\x1D\110          AVX512
+ymmreg_mz,bmem32         \350\361\351\375\1\x1D\110          AVX512,T1F32,BCST16
+
+[VCVTQQ2PH,vcvtqq2phS]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,mem512         \350\352\351\375\1\x5B\110          AVX512,TFV
+xmmreg_mz,mem256         \350\352\364\375\1\x5B\110          AVX512,TFV
+xmmreg_mz,xmmrm          \350\352\375\1\x5B\110              AVX512,TFV
+xmmreg_mz,bmem64         \350\352\375\1\x5B\110              AVX512,T1F64,BCST2
+xmmreg_mz,ymmreg         \350\352\364\375\1\x5B\110          AVX512,TFV
+xmmreg_mz,bmem64         \350\352\364\375\1\x5B\110          AVX512,T1F64,BCST4
+xmmreg_mz,zmmreg_er      \350\352\351\375\1\x5B\110          AVX512
+xmmreg_mz,bmem64         \350\352\351\375\1\x5B\110          AVX512,T1F64,BCST8
+
+[VCVTSD2SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er   \350\352\334\375\1\x5A\75\120   AVX512
+xmmreg_mz,xmmreg,mem64       \350\352\334\375\1\x5A\75\120   AVX512,T1F64
+
+[VCVTSH2SD]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae  \350\333\375\1\x5A\75\120       AVX512
+xmmreg_mz,xmmreg,mem16       \350\333\375\1\x5A\75\120       AVX512,T1S
+
+[VCVTSH2SI]
+(Ch_Wop2, Ch_Rop1)
+reg32,xmmreg_er          \350\333\375\1\x2D\110              AVX512
+reg32,mem16              \350\333\375\1\x2D\110              AVX512,T1S
+reg64,xmmreg_er          \350\352\333\375\1\x2D\110          AVX512,X86_64
+reg64,mem16              \350\352\333\375\1\x2D\110          AVX512,T1S,X86_64
+
+[VCVTSH2SS]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae    \350\376\1\x13\75\120         AVX512
+xmmreg_mz,xmmreg,mem16         \350\376\1\x13\75\120         AVX512,T1S
+
+[VCVTSH2USI]
+(Ch_Wop2, Ch_Rop1)
+reg32,xmmreg_er          \350\333\375\1\x79\110              AVX512
+reg32,mem16              \350\333\375\1\x79\110              AVX512,T1S
+reg64,xmmreg_er          \350\352\333\375\1\x79\110          AVX512,X86_64
+reg64,mem16              \350\352\333\375\1\x79\110          AVX512,T1S,X86_64
+
+[VCVTSI2SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg,xmmreg_er,reg32   \350\333\375\1\x2A\75\120           AVX512
+xmmreg,xmmreg,mem32      \350\333\375\1\x2A\75\120           AVX512,T1S
+xmmreg,xmmreg_er,reg64   \350\352\333\375\1\x2A\75\120       AVX512,X86_64
+xmmreg,xmmreg,mem64      \350\352\333\375\1\x2A\75\120       AVX512,T1S,X86_64
+
+[VCVTSS2SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er  \350\375\1\x1D\75\120            AVX512
+xmmreg_mz,xmmreg,mem32      \350\375\1\x1D\75\120            AVX512,T1S
+
+[VCVTTPH2DQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem256         \350\333\351\375\1\x5B\110          AVX512,THV
+ymmreg_mz,mem128         \350\333\364\375\1\x5B\110          AVX512,THV
+xmmreg_mz,xmmreg         \350\333\375\1\x5B\110              AVX512,THV
+xmmreg_mz,mem64          \350\333\375\1\x5B\110              AVX512,THV
+xmmreg_mz,bmem16         \350\333\375\1\x5B\110              AVX512,T1S,BCST4
+ymmreg_mz,xmmreg         \350\333\364\375\1\x5B\110          AVX512,THV
+ymmreg_mz,bmem16         \350\333\364\375\1\x5B\110          AVX512,T1S,BCST8
+zmmreg_mz,ymmreg_sae     \350\333\351\375\1\x5B\110          AVX512
+zmmreg_mz,bmem16         \350\333\351\375\1\x5B\110          AVX512,T1S,BCST16
+
+[VCVTTPH2QQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem128         \350\361\351\375\1\x7A\110          AVX512,TQVM
+ymmreg_mz,mem64          \350\361\364\375\1\x7A\110          AVX512,TQVM
+xmmreg_mz,xmmreg         \350\361\375\1\x7A\110              AVX512,TQVM
+xmmreg_mz,mem32          \350\361\375\1\x7A\110              AVX512,TQVM
+xmmreg_mz,bmem16         \350\361\375\1\x7A\110              AVX512,T1S,BCST2
+ymmreg_mz,xmmreg         \350\361\364\375\1\x7A\110          AVX512,TQVM
+ymmreg_mz,bmem16         \350\361\364\375\1\x7A\110          AVX512,T1S,BCST4
+zmmreg_mz,xmmreg_sae     \350\361\351\375\1\x7A\110          AVX512
+zmmreg_mz,bmem16         \350\361\351\375\1\x7A\110          AVX512,T1S,BCST8
+
+[VCVTTPH2UDQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem256         \350\351\375\1\x78\110              AVX512,THV
+ymmreg_mz,mem128         \350\364\375\1\x78\110              AVX512,THV
+xmmreg_mz,xmmreg         \350\375\1\x78\110                  AVX512,THV
+xmmreg_mz,mem64          \350\375\1\x78\110                  AVX512,THV
+xmmreg_mz,bmem16         \350\375\1\x78\110                  AVX512,T1S,BCST4
+ymmreg_mz,xmmreg         \350\364\375\1\x78\110              AVX512,THV
+ymmreg_mz,bmem16         \350\364\375\1\x78\110              AVX512,T1S,BCST8
+zmmreg_mz,ymmreg_sae     \350\351\375\1\x78\110              AVX512
+zmmreg_mz,bmem16         \350\351\375\1\x78\110              AVX512,T1S,BCST16
+
+[VCVTTPH2UQQ]
+(Ch_Wop2, Ch_Rop1)
+zmmreg_mz,mem128         \350\361\351\375\1\x78\110          AVX512,TQVM
+ymmreg_mz,mem64          \350\361\364\375\1\x78\110          AVX512,TQVM
+xmmreg_mz,xmmreg         \350\361\375\1\x78\110              AVX512,TQVM
+xmmreg_mz,mem32          \350\361\375\1\x78\110              AVX512,TQVM
+xmmreg_mz,bmem16         \350\361\375\1\x78\110              AVX512,T1S,BCST2
+ymmreg_mz,xmmreg         \350\361\364\375\1\x78\110          AVX512,TQVM
+ymmreg_mz,bmem16         \350\361\364\375\1\x78\110          AVX512,T1S,BCST4
+zmmreg_mz,xmmreg_sae     \350\361\351\375\1\x78\110          AVX512
+zmmreg_mz,bmem16         \350\361\351\375\1\x78\110          AVX512,T1S,BCST8
+
+[VCVTTPH2UW]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\375\1\x7C\110                  AVX512,TFV
+xmmreg_mz,bmem16         \350\375\1\x7C\110                  AVX512,TFV
+ymmreg_mz,ymmrm          \350\364\375\1\x7C\110              AVX512,TFV
+ymmreg_mz,bmem16         \350\364\375\1\x7C\110              AVX512,TFV
+zmmreg_mz,zmmreg_sae     \350\351\375\1\x7C\110              AVX512
+zmmreg_mz,mem512         \350\351\375\1\x7C\110              AVX512,TFV
+zmmreg_mz,bmem16         \350\351\375\1\x7C\110              AVX512,TFV
+
+[VCVTTPH2W]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\361\375\1\x7C\110              AVX512,TFV
+xmmreg_mz,bmem16         \350\361\375\1\x7C\110              AVX512,TFV
+ymmreg_mz,ymmrm          \350\361\364\375\1\x7C\110          AVX512,TFV
+ymmreg_mz,bmem16         \350\361\364\375\1\x7C\110          AVX512,TFV
+zmmreg_mz,zmmreg_sae     \350\361\351\375\1\x7C\110          AVX512
+zmmreg_mz,mem512         \350\361\351\375\1\x7C\110          AVX512,TFV
+zmmreg_mz,bmem16         \350\361\351\375\1\x7C\110          AVX512,TFV
+
+[VCVTTSH2SI]
+(Ch_Wop2, Ch_Rop1)
+reg32,xmmreg_sae         \350\333\375\1\x2C\110              AVX512
+reg32,mem16              \350\333\375\1\x2C\110              AVX512,T1S
+reg64,xmmreg_sae         \350\352\333\375\1\x2C\110          AVX512,X86_64
+reg64,mem16              \350\352\333\375\1\x2C\110          AVX512,T1S,X86_64
+
+[VCVTTSH2USI]
+(Ch_Wop2, Ch_Rop1)
+reg32,xmmreg_sae         \350\333\375\1\x78\110              AVX512
+reg32,mem16              \350\333\375\1\x78\110              AVX512,T1S
+reg64,xmmreg_sae         \350\352\333\375\1\x78\110          AVX512,X86_64
+reg64,mem16              \350\352\333\375\1\x78\110          AVX512,T1S,X86_64
+
+[VCVTUDQ2PH,vcvtudq2phN]
+(Ch_Wop2, Ch_Rop1)
+ymmreg_mz,mem512         \350\334\351\375\1\x7A\110          AVX512,TFV
+xmmreg_mz,mem256         \350\334\364\375\1\x7A\110          AVX512,TFV
+xmmreg_mz,xmmrm          \350\334\375\1\x7A\110              AVX512,TFV
+xmmreg_mz,bmem32         \350\334\375\1\x7A\110              AVX512,T1F32,BCST4
+xmmreg_mz,ymmreg         \350\334\364\375\1\x7A\110          AVX512,TFV
+xmmreg_mz,bmem32         \350\334\364\375\1\x7A\110          AVX512,T1F32,BCST8
+ymmreg_mz,zmmreg_er      \350\334\351\375\1\x7A\110          AVX512
+ymmreg_mz,bmem32         \350\334\351\375\1\x7A\110          AVX512,T1F32,BCST16
+
+[VCVTUQQ2PH,vcvtuqq2phS]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,mem512         \350\352\334\351\375\1\x7A\110      AVX512,TFV
+xmmreg_mz,mem256         \350\352\334\364\375\1\x7A\110      AVX512,TFV
+xmmreg_mz,xmmrm          \350\352\334\375\1\x7A\110          AVX512,TFV
+xmmreg_mz,bmem64         \350\352\334\375\1\x7A\110          AVX512,T1F64,BCST2
+xmmreg_mz,ymmreg         \350\352\334\364\375\1\x7A\110      AVX512,TFV
+xmmreg_mz,bmem64         \350\352\334\364\375\1\x7A\110      AVX512,T1F64,BCST4
+xmmreg_mz,zmmreg_er      \350\352\334\351\375\1\x7A\110      AVX512
+xmmreg_mz,bmem64         \350\352\334\351\375\1\x7A\110      AVX512,T1F64,BCST8
+
+
+[VCVTUSI2SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg,xmmreg_er,reg32   \350\333\375\1\x7B\75\120           AVX512
+xmmreg,xmmreg,mem32      \350\333\375\1\x7B\75\120           AVX512,T1S
+xmmreg,xmmreg_er,reg64   \350\352\333\375\1\x7B\75\120       AVX512,X86_64
+xmmreg,xmmreg,mem64      \350\352\333\375\1\x7B\75\120       AVX512,T1S,X86_64
+
+
+[VCVTUW2PH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\334\375\1\x7D\110              AVX512,TFV
+xmmreg_mz,bmem16         \350\334\375\1\x7D\110              AVX512,TFV
+ymmreg_mz,ymmrm          \350\334\364\375\1\x7D\110          AVX512,TFV
+ymmreg_mz,bmem16         \350\334\364\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,zmmreg_er      \350\334\351\375\1\x7D\110          AVX512
+zmmreg_mz,mem512         \350\334\351\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,bmem16         \350\334\351\375\1\x7D\110          AVX512,TFV
+
+[VCVTW2PH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm          \350\333\375\1\x7D\110              AVX512,TFV
+xmmreg_mz,bmem16         \350\333\375\1\x7D\110              AVX512,TFV
+ymmreg_mz,ymmrm          \350\333\364\375\1\x7D\110          AVX512,TFV
+ymmreg_mz,bmem16         \350\333\364\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,zmmreg_er      \350\333\351\375\1\x7D\110          AVX512
+zmmreg_mz,mem512         \350\333\351\375\1\x7D\110          AVX512,TFV
+zmmreg_mz,bmem16         \350\333\351\375\1\x7D\110          AVX512,TFV
+
+[VDIVPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\375\1\x5E\75\120               AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\375\1\x5E\75\120               AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\364\375\1\x5E\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\364\375\1\x5E\75\120           AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\351\375\1\x5E\75\120           AVX512
+zmmreg_mz,zmmreg,mem512        \350\351\375\1\x5E\75\120           AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\351\375\1\x5E\75\120           AVX512,TFV
+
+[VDIVSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\333\375\1\x5E\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\333\375\1\x5E\75\120           AVX512,T1S
+
+[VFCMADDCPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\334\376\1\x56\75\120           AVX512,DISTINCT,TFV
+xmmreg_mz,xmmreg,bmem32        \350\334\376\1\x56\75\120           AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\334\364\376\1\x56\75\120       AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,bmem32        \350\334\364\376\1\x56\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\334\351\376\1\x56\75\120       AVX512,DISTINCT
+zmmreg_mz,zmmreg,mem512        \350\334\351\376\1\x56\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,bmem32        \350\334\351\376\1\x56\75\120       AVX512,DISTINCT,TFV
+
+[VFCMADDCSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\334\376\1\x57\75\120           AVX512,DISTINCT
+xmmreg_mz,xmmreg,mem32         \350\334\376\1\x57\75\120           AVX512,DISTINCT,T1S
+
+[VFMADDCPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\333\376\1\x56\75\120           AVX512,DISTINCT,TFV
+xmmreg_mz,xmmreg,bmem32        \350\333\376\1\x56\75\120           AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\333\364\376\1\x56\75\120       AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,bmem32        \350\333\364\376\1\x56\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\333\351\376\1\x56\75\120       AVX512,DISTINCT
+zmmreg_mz,zmmreg,mem512        \350\333\351\376\1\x56\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,bmem32        \350\333\351\376\1\x56\75\120       AVX512,DISTINCT,TFV
+
+[VFMADDCSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\333\376\1\x57\75\120           AVX512,DISTINCT
+xmmreg_mz,xmmreg,mem32         \350\333\376\1\x57\75\120           AVX512,DISTINCT,T1S
+
+[VFCMULCPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\334\376\1\xD6\75\120           AVX512,DISTINCT,TFV
+xmmreg_mz,xmmreg,bmem32        \350\334\376\1\xD6\75\120           AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\334\364\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,bmem32        \350\334\364\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\334\351\376\1\xD6\75\120       AVX512,DISTINCT
+zmmreg_mz,zmmreg,mem512        \350\334\351\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,bmem32        \350\334\351\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+
+[VFCMULCSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\334\376\1\xD7\75\120           AVX512,DISTINCT
+xmmreg_mz,xmmreg,mem32         \350\334\376\1\xD7\75\120           AVX512,DISTINCT,T1S
+
+[VFMULCPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\333\376\1\xD6\75\120           AVX512,DISTINCT,TFV
+xmmreg_mz,xmmreg,bmem32        \350\333\376\1\xD6\75\120           AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\333\364\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+ymmreg_mz,ymmreg,bmem32        \350\333\364\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\333\351\376\1\xD6\75\120       AVX512,DISTINCT
+zmmreg_mz,zmmreg,mem512        \350\333\351\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+zmmreg_mz,zmmreg,bmem32        \350\333\351\376\1\xD6\75\120       AVX512,DISTINCT,TFV
+
+[VFMULCSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\333\376\1\xD7\75\120           AVX512,DISTINCT
+xmmreg_mz,xmmreg,mem32         \350\333\376\1\xD7\75\120           AVX512,DISTINCT,T1S
+
+[VFMADDSUB132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x96\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x96\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x96\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x96\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x96\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x96\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x96\75\120       AVX512,TFV
+
+[VFMADDSUB213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xA6\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xA6\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xA6\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xA6\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xA6\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xA6\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xA6\75\120       AVX512,TFV
+
+[VFMADDSUB231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xB6\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xB6\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xB6\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xB6\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xB6\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xB6\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xB6\75\120       AVX512,TFV
+
+[VFMSUBADD132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x97\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x97\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x97\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x97\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x97\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x97\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x97\75\120       AVX512,TFV
+
+[VFMSUBADD213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xA7\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xA7\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xA7\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xA7\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xA7\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xA7\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xA7\75\120       AVX512,TFV
+
+[VFMSUBADD231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xB7\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xB7\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xB7\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xB7\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xB7\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xB7\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xB7\75\120       AVX512,TFV
+
+[VFMADD132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x98\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x98\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x98\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x98\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x98\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x98\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x98\75\120       AVX512,TFV
+
+[VFMADD213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xA8\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xA8\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xA8\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xA8\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xA8\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xA8\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xA8\75\120       AVX512,TFV
+
+[VFMADD231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xB8\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xB8\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xB8\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xB8\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xB8\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xB8\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xB8\75\120       AVX512,TFV
+
+[VFNMADD132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x9C\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x9C\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x9C\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x9C\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x9C\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x9C\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x9C\75\120       AVX512,TFV
+
+[VFNMADD213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xAC\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xAC\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xAC\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xAC\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xAC\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xAC\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xAC\75\120       AVX512,TFV
+
+[VFNMADD231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xBC\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xBC\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xBC\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xBC\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xBC\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xBC\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xBC\75\120       AVX512,TFV
+
+[VFMADD132SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\x99\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\x99\75\120           AVX512,T1S
+
+[VFMADD213SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\xA9\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\xA9\75\120           AVX512,T1S
+
+[VFMADD231SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\xB9\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\xB9\75\120           AVX512,T1S
+
+[VFNMADD132SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\x9D\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\x9D\75\120           AVX512,T1S
+
+[VFNMADD213SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\xAD\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\xAD\75\120           AVX512,T1S
+
+[VFNMADD231SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er     \350\361\376\1\xBD\75\120           AVX512
+xmmreg_mz,xmmreg,mem16         \350\361\376\1\xBD\75\120           AVX512,T1S
+
+[VFMSUB132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x9A\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x9A\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x9A\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x9A\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x9A\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x9A\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x9A\75\120       AVX512,TFV
+
+[VFMSUB213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xAA\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xAA\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xAA\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xAA\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xAA\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xAA\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xAA\75\120       AVX512,TFV
+
+[VFMSUB231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xBA\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xBA\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xBA\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xBA\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xBA\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xBA\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xBA\75\120       AVX512,TFV
+
+[VFNMSUB132PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\x9E\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\x9E\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\x9E\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\x9E\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\x9E\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\x9E\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\x9E\75\120       AVX512,TFV
+
+[VFNMSUB213PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xAE\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xAE\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xAE\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xAE\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xAE\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xAE\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xAE\75\120       AVX512,TFV
+
+[VFNMSUB231PH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm         \350\361\376\1\xBE\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16        \350\361\376\1\xBE\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm         \350\361\364\376\1\xBE\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16        \350\361\364\376\1\xBE\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er     \350\361\351\376\1\xBE\75\120       AVX512
+zmmreg_mz,zmmreg,mem512        \350\361\351\376\1\xBE\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16        \350\361\351\376\1\xBE\75\120       AVX512,TFV
+
+[VFMSUB132SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\x9B\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x9B\75\120       AVX512,T1S
+
+[VFMSUB213SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\xAB\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\xAB\75\120       AVX512,T1S
+
+[VFMSUB231SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\xBB\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\xBB\75\120       AVX512,T1S
+
+[VFNMSUB132SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\x9F\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x9F\75\120       AVX512,T1S
+
+[VFNMSUB213SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\xAF\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\xAF\75\120       AVX512,T1S
+
+[VFNMSUB231SH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\xBF\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\xBF\75\120       AVX512,T1S
+
+[VFPCLASSPH,vfpclassphS]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+kreg_m,mem256,imm8            \350\364\372\1\x66\110\26       AVX512,TFV
+kreg_m,mem512,imm8            \350\351\372\1\x66\110\26       AVX512,TFV
+kreg_m,xmmrm,imm8             \350\372\1\x66\110\26           AVX512,TFV
+kreg_m,bmem16,imm8            \350\372\1\x66\110\26           AVX512,T1S,BCST8
+kreg_m,ymmreg,imm8            \350\364\372\1\x66\110\26       AVX512
+kreg_m,bmem16,imm8            \350\364\372\1\x66\110\26       AVX512,T1S,BCST16
+kreg_m,zmmreg,imm8            \350\351\372\1\x66\110\26       AVX512
+kreg_m,bmem16,imm8            \350\351\372\1\x66\110\26       AVX512,T1S,BCST32
+
+[VFPCLASSSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+kreg_m,xmmreg,imm8            \350\372\1\x67\110\26           AVX512
+kreg_m,mem16,imm8             \350\372\1\x67\110\26           AVX512,T1S
+
+[VGETEXPPH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm               \350\361\376\1\x42\110          AVX512,TFV
+xmmreg_mz,bmem16              \350\361\376\1\x42\110          AVX512,TFV
+ymmreg_mz,ymmrm               \350\361\364\376\1\x42\110      AVX512,TFV
+ymmreg_mz,bmem16              \350\361\364\376\1\x42\110      AVX512,TFV
+zmmreg_mz,zmmreg_sae          \350\361\351\376\1\x42\110      AVX512
+zmmreg_mz,mem512              \350\361\351\376\1\x42\110      AVX512,TFV
+zmmreg_mz,bmem16              \350\361\351\376\1\x42\110      AVX512,TFV
+
+[VGETEXPSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae   \350\361\376\1\x43\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x43\75\120       AVX512,T1S
+
+[VGETMANTPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmrm,imm8          \350\372\1\x26\110\26           AVX512,TFV
+xmmreg_mz,bmem16,imm8         \350\372\1\x26\110\26           AVX512,TFV
+ymmreg_mz,ymmrm,imm8          \350\364\372\1\x26\110\26       AVX512,TFV
+ymmreg_mz,bmem16,imm8         \350\364\372\1\x26\110\26       AVX512,TFV
+zmmreg_mz,zmmreg_sae,imm8     \350\351\372\1\x26\110\26       AVX512
+zmmreg_mz,mem512,imm8         \350\351\372\1\x26\110\26       AVX512,TFV
+zmmreg_mz,bmem16,imm8         \350\351\372\1\x26\110\26       AVX512,T1S
+
+[VGETMANTSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae,imm8  \350\372\1\x27\75\120\27    AVX512
+xmmreg_mz,xmmreg,mem16,imm8       \350\372\1\x27\75\120\27    AVX512,T1S
+
+[VMAXPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm        \350\375\1\x5F\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16       \350\375\1\x5F\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm        \350\364\375\1\x5F\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16       \350\364\375\1\x5F\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_sae   \350\351\375\1\x5F\75\120       AVX512
+zmmreg_mz,zmmreg,mem512       \350\351\375\1\x5F\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16       \350\351\375\1\x5F\75\120       AVX512,TFV
+
+[VMAXSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae   \350\333\375\1\x5F\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\333\375\1\x5F\75\120       AVX512,T1S
+
+[VMINPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm        \350\375\1\x5D\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16       \350\375\1\x5D\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm        \350\364\375\1\x5D\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16       \350\364\375\1\x5D\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_sae   \350\351\375\1\x5D\75\120       AVX512
+zmmreg_mz,zmmreg,mem512       \350\351\375\1\x5D\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16       \350\351\375\1\x5D\75\120       AVX512,TFV
+
+[VMINSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae   \350\333\375\1\x5D\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\333\375\1\x5D\75\120       AVX512,T1S
+
+[VMULPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm        \350\375\1\x59\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16       \350\375\1\x59\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm        \350\364\375\1\x59\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16       \350\364\375\1\x59\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er    \350\351\375\1\x59\75\120       AVX512
+zmmreg_mz,zmmreg,mem512       \350\351\375\1\x59\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16       \350\351\375\1\x59\75\120       AVX512,TFV
+
+[VMULSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\333\375\1\x59\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\333\375\1\x59\75\120       AVX512,T1S
+
+[VRCPPH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm               \350\361\376\1\x4C\110          AVX512,TFV
+xmmreg_mz,bmem16              \350\361\376\1\x4C\110          AVX512,TFV
+ymmreg_mz,ymmrm               \350\361\364\376\1\x4C\110      AVX512,TFV
+ymmreg_mz,bmem16              \350\361\364\376\1\x4C\110      AVX512,TFV
+zmmreg_mz,zmmrm               \350\361\351\376\1\x4C\110      AVX512,TFV
+zmmreg_mz,bmem16              \350\361\351\376\1\x4C\110      AVX512,TFV
+
+[VRCPSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg       \350\361\376\1\x4D\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x4D\75\120       AVX512,T1S
+
+
+[VREDUCEPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmrm,imm8          \350\372\1\x56\110\26           AVX512,TFV
+xmmreg_mz,bmem16,imm8         \350\372\1\x56\110\26           AVX512,TFV
+ymmreg_mz,ymmrm,imm8          \350\364\372\1\x56\110\26       AVX512,TFV
+ymmreg_mz,bmem16,imm8         \350\364\372\1\x56\110\26       AVX512,TFV
+zmmreg_mz,zmmreg_sae,imm8     \350\351\372\1\x56\110\26       AVX512
+zmmreg_mz,mem512,imm8         \350\351\372\1\x56\110\26       AVX512,TFV
+zmmreg_mz,bmem16,imm8         \350\351\372\1\x56\110\26       AVX512,TFV
+
+[VREDUCESH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae,imm8  \350\372\1\x57\75\120\27    AVX512
+xmmreg_mz,xmmreg,mem16,imm8       \350\372\1\x57\75\120\27    AVX512,T1S
+
+
+[VRNDSCALEPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmrm,imm8          \350\372\1\x08\110\26           AVX512,TFV
+xmmreg_mz,bmem16,imm8         \350\372\1\x08\110\26           AVX512,TFV
+ymmreg_mz,ymmrm,imm8          \350\364\372\1\x08\110\26       AVX512,TFV
+ymmreg_mz,bmem16,imm8         \350\364\372\1\x08\110\26       AVX512,TFV
+zmmreg_mz,zmmreg_sae,imm8     \350\351\372\1\x08\110\26       AVX512
+zmmreg_mz,mem512,imm8         \350\351\372\1\x08\110\26       AVX512,TFV
+zmmreg_mz,bmem16,imm8         \350\351\372\1\x08\110\26       AVX512,TFV
+
+[VRNDSCALESH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_sae,imm8  \350\372\1\x0A\75\120\27    AVX512
+xmmreg_mz,xmmreg,mem16,imm8       \350\372\1\x0A\75\120\27    AVX512,T1S
+
+[VRSQRTPH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm               \350\361\376\1\x4E\110          AVX512,TFV
+xmmreg_mz,bmem16              \350\361\376\1\x4E\110          AVX512,TFV
+ymmreg_mz,ymmrm               \350\361\364\376\1\x4E\110      AVX512,TFV
+ymmreg_mz,bmem16              \350\361\364\376\1\x4E\110      AVX512,TFV
+zmmreg_mz,zmmrm               \350\361\351\376\1\x4E\110      AVX512,TFV
+zmmreg_mz,bmem16              \350\361\351\376\1\x4E\110      AVX512,TFV
+
+[VRSQRTSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg       \350\361\376\1\x4F\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x4F\75\120       AVX512,T1S
+
+[VSCALEFPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm        \350\361\376\1\x2C\75\120       AVX512,TFV
+xmmreg_mz,xmmreg,bmem16       \350\361\376\1\x2C\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm        \350\361\364\376\1\x2C\75\120   AVX512,TFV
+ymmreg_mz,ymmreg,bmem16       \350\361\364\376\1\x2C\75\120   AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er    \350\361\351\376\1\x2C\75\120   AVX512
+zmmreg_mz,zmmreg,mem512       \350\361\351\376\1\x2C\75\120   AVX512,TFV
+zmmreg_mz,zmmreg,bmem16       \350\361\351\376\1\x2C\75\120   AVX512,TFV
+
+[VSCALEFSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\361\376\1\x2D\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\361\376\1\x2D\75\120       AVX512,T1S
+
+[VSQRTPH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg_mz,xmmrm               \350\375\1\x51\110              AVX512,TFV
+xmmreg_mz,bmem16              \350\375\1\x51\110              AVX512,TFV
+ymmreg_mz,ymmrm               \350\364\375\1\x51\110          AVX512,TFV
+ymmreg_mz,bmem16              \350\364\375\1\x51\110          AVX512,TFV
+zmmreg_mz,zmmreg_er           \350\351\375\1\x51\110          AVX512
+zmmreg_mz,mem512              \350\351\375\1\x51\110          AVX512,TFV
+zmmreg_mz,bmem16              \350\351\375\1\x51\110          AVX512,TFV
+
+[VSQRTSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\333\375\1\x51\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\333\375\1\x51\75\120       AVX512,T1S
+
+[VSUBPH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmrm        \350\375\1\x5C\75\120           AVX512,TFV
+xmmreg_mz,xmmreg,bmem16       \350\375\1\x5C\75\120           AVX512,TFV
+ymmreg_mz,ymmreg,ymmrm        \350\364\375\1\x5C\75\120       AVX512,TFV
+ymmreg_mz,ymmreg,bmem16       \350\364\375\1\x5C\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,zmmreg_er    \350\351\375\1\x5C\75\120       AVX512
+zmmreg_mz,zmmreg,mem512       \350\351\375\1\x5C\75\120       AVX512,TFV
+zmmreg_mz,zmmreg,bmem16       \350\351\375\1\x5C\75\120       AVX512,TFV
+
+[VSUBSH]
+(Ch_Wop3, Ch_Rop2, Ch_Rop1)
+xmmreg_mz,xmmreg,xmmreg_er    \350\333\375\1\x5C\75\120       AVX512
+xmmreg_mz,xmmreg,mem16        \350\333\375\1\x5C\75\120       AVX512,T1S
+
+[VUCOMISH]
+(Ch_Wop2, Ch_Rop1)
+xmmreg,xmmreg_sae             \350\375\1\x2E\110              AVX512
+xmmreg,mem16                  \350\375\1\x2E\110              AVX512,T1S

+ 179 - 0
compiler/x86_64/x8664ats.inc

@@ -1570,5 +1570,184 @@ attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
 attsufNONE,
+attsufMMX,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMX,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufMMS,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
+attsufNONE,
 attsufNONE
 attsufNONE
 );
 );

+ 180 - 1
compiler/x86_64/x8664att.inc

@@ -1569,6 +1569,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 180 - 1
compiler/x86_64/x8664int.inc

@@ -1569,6 +1569,185 @@
 'gf2p8affineinvqb',
 'gf2p8affineinvqb',
 'gf2p8affineqb',
 'gf2p8affineqb',
 'gf2p8mulb',
 'gf2p8mulb',
+'vcvtne2ps2bf16',
+'vcvtneps2bf16',
+'vdpbf16ps',
+'v4fmaddps',
+'v4fmaddss',
+'v4fnmaddps',
+'v4fnmaddss',
+'vp4dpwssd',
+'vp4dpwssds',
 'vp2intersectd',
 'vp2intersectd',
-'vp2intersectq'
+'vp2intersectq',
+'vmovw',
+'vmovsh',
+'vaddph',
+'vaddsh',
+'vcmpeqph',
+'vcmpltph',
+'vcmpleph',
+'vcmpunordph',
+'vcmpneqph',
+'vcmpnltph',
+'vcmpnleph',
+'vcmpordph',
+'vcmpeq_uqph',
+'vcmpngeph',
+'vcmpngtph',
+'vcmpfalseph',
+'vcmpneq_oqph',
+'vcmpgeph',
+'vcmpgtph',
+'vcmptrueph',
+'vcmpeq_osph',
+'vcmplt_oqph',
+'vcmple_oqph',
+'vcmpunord_sph',
+'vcmpneq_usph',
+'vcmpnlt_uqph',
+'vcmpnle_uqph',
+'vcmpord_sph',
+'vcmpeq_usph',
+'vcmpnge_uqph',
+'vcmpngt_uqph',
+'vcmpfalse_osph',
+'vcmpneq_osph',
+'vcmpge_oqph',
+'vcmpgt_oqph',
+'vcmptrue_usph',
+'vcmpeqsh',
+'vcmpltsh',
+'vcmplesh',
+'vcmpunordsh',
+'vcmpneqsh',
+'vcmpnltsh',
+'vcmpnlesh',
+'vcmpordsh',
+'vcmpeq_uqsh',
+'vcmpngesh',
+'vcmpngtsh',
+'vcmpfalsesh',
+'vcmpneq_oqsh',
+'vcmpgesh',
+'vcmpgtsh',
+'vcmptruesh',
+'vcmpeq_ossh',
+'vcmplt_oqsh',
+'vcmple_oqsh',
+'vcmpunord_ssh',
+'vcmpneq_ussh',
+'vcmpnlt_uqsh',
+'vcmpnle_uqsh',
+'vcmpord_ssh',
+'vcmpeq_ussh',
+'vcmpnge_uqsh',
+'vcmpngt_uqsh',
+'vcmpfalse_ossh',
+'vcmpneq_ossh',
+'vcmpge_oqsh',
+'vcmpgt_oqsh',
+'vcmptrue_ussh',
+'vcmpph',
+'vcmpsh',
+'vcomish',
+'vcvtdq2ph',
+'vcvtpd2ph',
+'vcvtph2dq',
+'vcvtph2pd',
+'vcvtph2psx',
+'vcvtph2qq',
+'vcvtph2udq',
+'vcvtph2uqq',
+'vcvtph2uw',
+'vcvtph2w',
+'vcvtps2phx',
+'vcvtqq2ph',
+'vcvtsd2sh',
+'vcvtsh2sd',
+'vcvtsh2si',
+'vcvtsh2ss',
+'vcvtsh2usi',
+'vcvtsi2sh',
+'vcvtss2sh',
+'vcvttph2dq',
+'vcvttph2qq',
+'vcvttph2udq',
+'vcvttph2uqq',
+'vcvttph2uw',
+'vcvttph2w',
+'vcvttsh2si',
+'vcvttsh2usi',
+'vcvtudq2ph',
+'vcvtuqq2ph',
+'vcvtusi2sh',
+'vcvtuw2ph',
+'vcvtw2ph',
+'vdivph',
+'vdivsh',
+'vfcmaddcph',
+'vfcmaddcsh',
+'vfmaddcph',
+'vfmaddcsh',
+'vfcmulcph',
+'vfcmulcsh',
+'vfmulcph',
+'vfmulcsh',
+'vfmaddsub132ph',
+'vfmaddsub213ph',
+'vfmaddsub231ph',
+'vfmsubadd132ph',
+'vfmsubadd213ph',
+'vfmsubadd231ph',
+'vfmadd132ph',
+'vfmadd213ph',
+'vfmadd231ph',
+'vfnmadd132ph',
+'vfnmadd213ph',
+'vfnmadd231ph',
+'vfmadd132sh',
+'vfmadd213sh',
+'vfmadd231sh',
+'vfnmadd132sh',
+'vfnmadd213sh',
+'vfnmadd231sh',
+'vfmsub132ph',
+'vfmsub213ph',
+'vfmsub231ph',
+'vfnmsub132ph',
+'vfnmsub213ph',
+'vfnmsub231ph',
+'vfmsub132sh',
+'vfmsub213sh',
+'vfmsub231sh',
+'vfnmsub132sh',
+'vfnmsub213sh',
+'vfnmsub231sh',
+'vfpclassph',
+'vfpclasssh',
+'vgetexpph',
+'vgetexpsh',
+'vgetmantph',
+'vgetmantsh',
+'vmaxph',
+'vmaxsh',
+'vminph',
+'vminsh',
+'vmulph',
+'vmulsh',
+'vrcpph',
+'vrcpsh',
+'vreduceph',
+'vreducesh',
+'vrndscaleph',
+'vrndscalesh',
+'vrsqrtph',
+'vrsqrtsh',
+'vscalefph',
+'vscalefsh',
+'vsqrtph',
+'vsqrtsh',
+'vsubph',
+'vsubsh',
+'vucomish'
 );
 );

+ 1 - 1
compiler/x86_64/x8664nop.inc

@@ -1,2 +1,2 @@
 { don't edit, this file is generated from x86ins.dat }
 { don't edit, this file is generated from x86ins.dat }
-5175;
+6061;

+ 180 - 1
compiler/x86_64/x8664op.inc

@@ -1569,6 +1569,185 @@ A_VGF2P8MULB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEINVQB,
 A_GF2P8AFFINEQB,
 A_GF2P8AFFINEQB,
 A_GF2P8MULB,
 A_GF2P8MULB,
+A_VCVTNE2PS2BF16,
+A_VCVTNEPS2BF16,
+A_VDPBF16PS,
+A_V4FMADDPS,
+A_V4FMADDSS,
+A_V4FNMADDPS,
+A_V4FNMADDSS,
+A_VP4DPWSSD,
+A_VP4DPWSSDS,
 A_VP2INTERSECTD,
 A_VP2INTERSECTD,
-A_VP2INTERSECTQ
+A_VP2INTERSECTQ,
+A_VMOVW,
+A_VMOVSH,
+A_VADDPH,
+A_VADDSH,
+A_VCMPEQPH,
+A_VCMPLTPH,
+A_VCMPLEPH,
+A_VCMPUNORDPH,
+A_VCMPNEQPH,
+A_VCMPNLTPH,
+A_VCMPNLEPH,
+A_VCMPORDPH,
+A_VCMPEQ_UQPH,
+A_VCMPNGEPH,
+A_VCMPNGTPH,
+A_VCMPFALSEPH,
+A_VCMPNEQ_OQPH,
+A_VCMPGEPH,
+A_VCMPGTPH,
+A_VCMPTRUEPH,
+A_VCMPEQ_OSPH,
+A_VCMPLT_OQPH,
+A_VCMPLE_OQPH,
+A_VCMPUNORD_SPH,
+A_VCMPNEQ_USPH,
+A_VCMPNLT_UQPH,
+A_VCMPNLE_UQPH,
+A_VCMPORD_SPH,
+A_VCMPEQ_USPH,
+A_VCMPNGE_UQPH,
+A_VCMPNGT_UQPH,
+A_VCMPFALSE_OSPH,
+A_VCMPNEQ_OSPH,
+A_VCMPGE_OQPH,
+A_VCMPGT_OQPH,
+A_VCMPTRUE_USPH,
+A_VCMPEQSH,
+A_VCMPLTSH,
+A_VCMPLESH,
+A_VCMPUNORDSH,
+A_VCMPNEQSH,
+A_VCMPNLTSH,
+A_VCMPNLESH,
+A_VCMPORDSH,
+A_VCMPEQ_UQSH,
+A_VCMPNGESH,
+A_VCMPNGTSH,
+A_VCMPFALSESH,
+A_VCMPNEQ_OQSH,
+A_VCMPGESH,
+A_VCMPGTSH,
+A_VCMPTRUESH,
+A_VCMPEQ_OSSH,
+A_VCMPLT_OQSH,
+A_VCMPLE_OQSH,
+A_VCMPUNORD_SSH,
+A_VCMPNEQ_USSH,
+A_VCMPNLT_UQSH,
+A_VCMPNLE_UQSH,
+A_VCMPORD_SSH,
+A_VCMPEQ_USSH,
+A_VCMPNGE_UQSH,
+A_VCMPNGT_UQSH,
+A_VCMPFALSE_OSSH,
+A_VCMPNEQ_OSSH,
+A_VCMPGE_OQSH,
+A_VCMPGT_OQSH,
+A_VCMPTRUE_USSH,
+A_VCMPPH,
+A_VCMPSH,
+A_VCOMISH,
+A_VCVTDQ2PH,
+A_VCVTPD2PH,
+A_VCVTPH2DQ,
+A_VCVTPH2PD,
+A_VCVTPH2PSX,
+A_VCVTPH2QQ,
+A_VCVTPH2UDQ,
+A_VCVTPH2UQQ,
+A_VCVTPH2UW,
+A_VCVTPH2W,
+A_VCVTPS2PHX,
+A_VCVTQQ2PH,
+A_VCVTSD2SH,
+A_VCVTSH2SD,
+A_VCVTSH2SI,
+A_VCVTSH2SS,
+A_VCVTSH2USI,
+A_VCVTSI2SH,
+A_VCVTSS2SH,
+A_VCVTTPH2DQ,
+A_VCVTTPH2QQ,
+A_VCVTTPH2UDQ,
+A_VCVTTPH2UQQ,
+A_VCVTTPH2UW,
+A_VCVTTPH2W,
+A_VCVTTSH2SI,
+A_VCVTTSH2USI,
+A_VCVTUDQ2PH,
+A_VCVTUQQ2PH,
+A_VCVTUSI2SH,
+A_VCVTUW2PH,
+A_VCVTW2PH,
+A_VDIVPH,
+A_VDIVSH,
+A_VFCMADDCPH,
+A_VFCMADDCSH,
+A_VFMADDCPH,
+A_VFMADDCSH,
+A_VFCMULCPH,
+A_VFCMULCSH,
+A_VFMULCPH,
+A_VFMULCSH,
+A_VFMADDSUB132PH,
+A_VFMADDSUB213PH,
+A_VFMADDSUB231PH,
+A_VFMSUBADD132PH,
+A_VFMSUBADD213PH,
+A_VFMSUBADD231PH,
+A_VFMADD132PH,
+A_VFMADD213PH,
+A_VFMADD231PH,
+A_VFNMADD132PH,
+A_VFNMADD213PH,
+A_VFNMADD231PH,
+A_VFMADD132SH,
+A_VFMADD213SH,
+A_VFMADD231SH,
+A_VFNMADD132SH,
+A_VFNMADD213SH,
+A_VFNMADD231SH,
+A_VFMSUB132PH,
+A_VFMSUB213PH,
+A_VFMSUB231PH,
+A_VFNMSUB132PH,
+A_VFNMSUB213PH,
+A_VFNMSUB231PH,
+A_VFMSUB132SH,
+A_VFMSUB213SH,
+A_VFMSUB231SH,
+A_VFNMSUB132SH,
+A_VFNMSUB213SH,
+A_VFNMSUB231SH,
+A_VFPCLASSPH,
+A_VFPCLASSSH,
+A_VGETEXPPH,
+A_VGETEXPSH,
+A_VGETMANTPH,
+A_VGETMANTSH,
+A_VMAXPH,
+A_VMAXSH,
+A_VMINPH,
+A_VMINSH,
+A_VMULPH,
+A_VMULSH,
+A_VRCPPH,
+A_VRCPSH,
+A_VREDUCEPH,
+A_VREDUCESH,
+A_VRNDSCALEPH,
+A_VRNDSCALESH,
+A_VRSQRTPH,
+A_VRSQRTSH,
+A_VSCALEFPH,
+A_VSCALEFSH,
+A_VSQRTPH,
+A_VSQRTSH,
+A_VSUBPH,
+A_VSUBSH,
+A_VUCOMISH
 );
 );

+ 180 - 1
compiler/x86_64/x8664pro.inc

@@ -1570,5 +1570,184 @@
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Mop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
 (Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
-(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1])
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_All]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Wop4, Ch_Rop3, Ch_Rop2]),
+(Ch: [Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop3, Ch_Rop2, Ch_Rop1]),
+(Ch: [Ch_Wop2, Ch_Rop1])
 );
 );

File diff suppressed because it is too large
+ 421 - 106
compiler/x86_64/x8664tab.inc


Some files were not shown because too many files changed in this diff