linux-kernel - Re: [PATCH] x86: XOP prefix instructions decoder support

lists.openwall.net		lists / announce owl-users owl-dev john-users john-dev passwdqc-users yescrypt popa3d-users / oss-security kernel-hardening musl sabotage tlsify passwords / crypt-dev xvendor / Bugtraq Full-Disclosure linux-kernel linux-netdev linux-ext4 linux-hardening linux-cve-announce PHC
Open Source and information security mailing list archives
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-Id: <20250817093240.527825424989e5e2337b5775@kernel.org>
Date: Sun, 17 Aug 2025 09:32:40 +0900
From: Masami Hiramatsu (Google) <mhiramat@...nel.org>
To: "Alan J . Wylie" <alan@...ie.me.uk>, "Masami Hiramatsu (Google)"
 <mhiramat@...nel.org>
Cc: Josh Poimboeuf <jpoimboe@...nel.org>, Thomas Gleixner
 <tglx@...utronix.de>, Ingo Molnar <mingo@...hat.com>, Borislav Petkov
 <bp@...en8.de>, Dave Hansen <dave.hansen@...ux.intel.com>, "Alan J . Wylie"
 <alan@...ie.me.uk>, linux-kernel@...r.kernel.org,
 regressions@...ts.linux.dev, stable@...r.kernel.org, Linus Torvalds
 <torvalds@...ux-foundation.org>, x86@...nel.org, "H . Peter Anvin"
 <hpa@...or.com>
Subject: Re: [PATCH] x86: XOP prefix instructions decoder support

Hi Alan, 

Can you test this with our cros-compile build?

Thank you,

On Wed, 30 Jul 2025 16:46:52 +0900
"Masami Hiramatsu (Google)" <mhiramat@...nel.org> wrote:

> From: Masami Hiramatsu (Google) <mhiramat@...nel.org>
> 
> Support decoding AMD's XOP prefix encoded instructions.
> 
> These instructions are introduced for Bulldozer micro architecture,
> and not supported on Intel's processors. But when compiling kernel
> with CONFIG_X86_NATIVE_CPU on some AMD processor (e.g. -march=bdver2),
> these instructions can be used.
> 
> Reported-by: Alan J. Wylie <alan@...ie.me.uk>
> Closes: https://lore.kernel.org/all/871pq06728.fsf@wylie.me.uk/
> Signed-off-by: Masami Hiramatsu (Google) <mhiramat@...nel.org>
> ---
>  arch/x86/include/asm/inat.h                        |   15 +++
>  arch/x86/include/asm/insn.h                        |   51 +++++++++
>  arch/x86/lib/inat.c                                |   13 ++
>  arch/x86/lib/insn.c                                |   35 +++++-
>  arch/x86/lib/x86-opcode-map.txt                    |  111 ++++++++++++++++++++
>  arch/x86/tools/gen-insn-attr-x86.awk               |   44 ++++++++
>  tools/arch/x86/include/asm/inat.h                  |   15 +++
>  tools/arch/x86/include/asm/insn.h                  |   51 +++++++++
>  tools/arch/x86/lib/inat.c                          |   13 ++
>  tools/arch/x86/lib/insn.c                          |   35 +++++-
>  tools/arch/x86/lib/x86-opcode-map.txt              |  111 ++++++++++++++++++++
>  tools/arch/x86/tools/gen-insn-attr-x86.awk         |   44 ++++++++
>  .../util/intel-pt-decoder/intel-pt-insn-decoder.c  |    2 
>  13 files changed, 513 insertions(+), 27 deletions(-)
> 
> diff --git a/arch/x86/include/asm/inat.h b/arch/x86/include/asm/inat.h
> index 97f341777db5..1b3060a3425c 100644
> --- a/arch/x86/include/asm/inat.h
> +++ b/arch/x86/include/asm/inat.h
> @@ -37,6 +37,8 @@
>  #define INAT_PFX_EVEX	15	/* EVEX prefix */
>  /* x86-64 REX2 prefix */
>  #define INAT_PFX_REX2	16	/* 0xD5 */
> +/* AMD XOP prefix */
> +#define INAT_PFX_XOP	17	/* 0x8F */
>  
>  #define INAT_LSTPFX_MAX	3
>  #define INAT_LGCPFX_MAX	11
> @@ -77,6 +79,7 @@
>  #define INAT_MOFFSET	(1 << (INAT_FLAG_OFFS + 3))
>  #define INAT_VARIANT	(1 << (INAT_FLAG_OFFS + 4))
>  #define INAT_VEXOK	(1 << (INAT_FLAG_OFFS + 5))
> +#define INAT_XOPOK	INAT_VEXOK
>  #define INAT_VEXONLY	(1 << (INAT_FLAG_OFFS + 6))
>  #define INAT_EVEXONLY	(1 << (INAT_FLAG_OFFS + 7))
>  #define INAT_NO_REX2	(1 << (INAT_FLAG_OFFS + 8))
> @@ -111,6 +114,8 @@ extern insn_attr_t inat_get_group_attribute(insn_byte_t modrm,
>  extern insn_attr_t inat_get_avx_attribute(insn_byte_t opcode,
>  					  insn_byte_t vex_m,
>  					  insn_byte_t vex_pp);
> +extern insn_attr_t inat_get_xop_attribute(insn_byte_t opcode,
> +					  insn_byte_t map_select);
>  
>  /* Attribute checking functions */
>  static inline int inat_is_legacy_prefix(insn_attr_t attr)
> @@ -164,6 +169,11 @@ static inline int inat_is_vex3_prefix(insn_attr_t attr)
>  	return (attr & INAT_PFX_MASK) == INAT_PFX_VEX3;
>  }
>  
> +static inline int inat_is_xop_prefix(insn_attr_t attr)
> +{
> +	return (attr & INAT_PFX_MASK) == INAT_PFX_XOP;
> +}
> +
>  static inline int inat_is_escape(insn_attr_t attr)
>  {
>  	return attr & INAT_ESC_MASK;
> @@ -229,6 +239,11 @@ static inline int inat_accept_vex(insn_attr_t attr)
>  	return attr & INAT_VEXOK;
>  }
>  
> +static inline int inat_accept_xop(insn_attr_t attr)
> +{
> +	return attr & INAT_XOPOK;
> +}
> +
>  static inline int inat_must_vex(insn_attr_t attr)
>  {
>  	return attr & (INAT_VEXONLY | INAT_EVEXONLY);
> diff --git a/arch/x86/include/asm/insn.h b/arch/x86/include/asm/insn.h
> index 7152ea809e6a..091f88c8254d 100644
> --- a/arch/x86/include/asm/insn.h
> +++ b/arch/x86/include/asm/insn.h
> @@ -71,7 +71,10 @@ struct insn {
>  					 * prefixes.bytes[3]: last prefix
>  					 */
>  	struct insn_field rex_prefix;	/* REX prefix */
> -	struct insn_field vex_prefix;	/* VEX prefix */
> +	union {
> +		struct insn_field vex_prefix;	/* VEX prefix */
> +		struct insn_field xop_prefix;	/* XOP prefix */
> +	};
>  	struct insn_field opcode;	/*
>  					 * opcode.bytes[0]: opcode1
>  					 * opcode.bytes[1]: opcode2
> @@ -135,6 +138,17 @@ struct insn {
>  #define X86_VEX_V(vex)	(((vex) & 0x78) >> 3)	/* VEX3 Byte2, VEX2 Byte1 */
>  #define X86_VEX_P(vex)	((vex) & 0x03)		/* VEX3 Byte2, VEX2 Byte1 */
>  #define X86_VEX_M_MAX	0x1f			/* VEX3.M Maximum value */
> +/* XOP bit fields */
> +#define X86_XOP_R(xop)	((xop) & 0x80)	/* XOP Byte2 */
> +#define X86_XOP_X(xop)	((xop) & 0x40)	/* XOP Byte2 */
> +#define X86_XOP_B(xop)	((xop) & 0x20)	/* XOP Byte2 */
> +#define X86_XOP_M(xop)	((xop) & 0x1f)	/* XOP Byte2 */
> +#define X86_XOP_W(xop)	((xop) & 0x80)	/* XOP Byte3 */
> +#define X86_XOP_V(xop)	((xop) & 0x78)	/* XOP Byte3 */
> +#define X86_XOP_L(xop)	((xop) & 0x04)	/* XOP Byte3 */
> +#define X86_XOP_P(xop)	((xop) & 0x03)	/* XOP Byte3 */
> +#define X86_XOP_M_MIN	0x08	/* Min of XOP.M */
> +#define X86_XOP_M_MAX	0x1f	/* Max of XOP.M */
>  
>  extern void insn_init(struct insn *insn, const void *kaddr, int buf_len, int x86_64);
>  extern int insn_get_prefixes(struct insn *insn);
> @@ -178,7 +192,7 @@ static inline insn_byte_t insn_rex2_m_bit(struct insn *insn)
>  	return X86_REX2_M(insn->rex_prefix.bytes[1]);
>  }
>  
> -static inline int insn_is_avx(struct insn *insn)
> +static inline int insn_is_avx_or_xop(struct insn *insn)
>  {
>  	if (!insn->prefixes.got)
>  		insn_get_prefixes(insn);
> @@ -192,6 +206,22 @@ static inline int insn_is_evex(struct insn *insn)
>  	return (insn->vex_prefix.nbytes == 4);
>  }
>  
> +/* If we already know this is AVX/XOP encoded */
> +static inline int avx_insn_is_xop(struct insn *insn)
> +{
> +	insn_attr_t attr = inat_get_opcode_attribute(insn->vex_prefix.bytes[0]);
> +
> +	return inat_is_xop_prefix(attr);
> +}
> +
> +static inline int insn_is_xop(struct insn *insn)
> +{
> +	if (!insn_is_avx_or_xop(insn))
> +		return 0;
> +
> +	return avx_insn_is_xop(insn);
> +}
> +
>  static inline int insn_has_emulate_prefix(struct insn *insn)
>  {
>  	return !!insn->emulate_prefix_size;
> @@ -222,11 +252,26 @@ static inline insn_byte_t insn_vex_w_bit(struct insn *insn)
>  	return X86_VEX_W(insn->vex_prefix.bytes[2]);
>  }
>  
> +static inline insn_byte_t insn_xop_map_bits(struct insn *insn)
> +{
> +	if (insn->xop_prefix.nbytes < 3)	/* XOP is 3 bytes */
> +		return 0;
> +	return X86_XOP_M(insn->xop_prefix.bytes[1]);
> +}
> +
> +static inline insn_byte_t insn_xop_p_bits(struct insn *insn)
> +{
> +	return X86_XOP_P(insn->vex_prefix.bytes[2]);
> +}
> +
>  /* Get the last prefix id from last prefix or VEX prefix */
>  static inline int insn_last_prefix_id(struct insn *insn)
>  {
> -	if (insn_is_avx(insn))
> +	if (insn_is_avx_or_xop(insn)) {
> +		if (avx_insn_is_xop(insn))
> +			return insn_xop_p_bits(insn);
>  		return insn_vex_p_bits(insn);	/* VEX_p is a SIMD prefix id */
> +	}
>  
>  	if (insn->prefixes.bytes[3])
>  		return inat_get_last_prefix_id(insn->prefixes.bytes[3]);
> diff --git a/arch/x86/lib/inat.c b/arch/x86/lib/inat.c
> index b0f3b2a62ae2..a5cafd402cfd 100644
> --- a/arch/x86/lib/inat.c
> +++ b/arch/x86/lib/inat.c
> @@ -81,3 +81,16 @@ insn_attr_t inat_get_avx_attribute(insn_byte_t opcode, insn_byte_t vex_m,
>  	return table[opcode];
>  }
>  
> +insn_attr_t inat_get_xop_attribute(insn_byte_t opcode, insn_byte_t map_select)
> +{
> +	const insn_attr_t *table;
> +
> +	if (map_select < X86_XOP_M_MIN || map_select > X86_XOP_M_MAX)
> +		return 0;
> +	map_select -= X86_XOP_M_MIN;
> +	/* At first, this checks the master table */
> +	table = inat_xop_tables[map_select];
> +	if (!table)
> +		return 0;
> +	return table[opcode];
> +}
> diff --git a/arch/x86/lib/insn.c b/arch/x86/lib/insn.c
> index 149a57e334ab..225af1399c9d 100644
> --- a/arch/x86/lib/insn.c
> +++ b/arch/x86/lib/insn.c
> @@ -200,12 +200,15 @@ int insn_get_prefixes(struct insn *insn)
>  	}
>  	insn->rex_prefix.got = 1;
>  
> -	/* Decode VEX prefix */
> +	/* Decode VEX/XOP prefix */
>  	b = peek_next(insn_byte_t, insn);
> -	attr = inat_get_opcode_attribute(b);
> -	if (inat_is_vex_prefix(attr)) {
> +	if (inat_is_vex_prefix(attr) || inat_is_xop_prefix(attr)) {
>  		insn_byte_t b2 = peek_nbyte_next(insn_byte_t, insn, 1);
> -		if (!insn->x86_64) {
> +
> +		if (inat_is_xop_prefix(attr) && X86_MODRM_REG(b2) == 0) {
> +			/* Grp1A.0 is always POP Ev */
> +			goto vex_end;
> +		} else if (!insn->x86_64) {
>  			/*
>  			 * In 32-bits mode, if the [7:6] bits (mod bits of
>  			 * ModRM) on the second byte are not 11b, it is
> @@ -226,13 +229,13 @@ int insn_get_prefixes(struct insn *insn)
>  			if (insn->x86_64 && X86_VEX_W(b2))
>  				/* VEX.W overrides opnd_size */
>  				insn->opnd_bytes = 8;
> -		} else if (inat_is_vex3_prefix(attr)) {
> +		} else if (inat_is_vex3_prefix(attr) || inat_is_xop_prefix(attr)) {
>  			b2 = peek_nbyte_next(insn_byte_t, insn, 2);
>  			insn_set_byte(&insn->vex_prefix, 2, b2);
>  			insn->vex_prefix.nbytes = 3;
>  			insn->next_byte += 3;
>  			if (insn->x86_64 && X86_VEX_W(b2))
> -				/* VEX.W overrides opnd_size */
> +				/* VEX.W/XOP.W overrides opnd_size */
>  				insn->opnd_bytes = 8;
>  		} else {
>  			/*
> @@ -288,9 +291,22 @@ int insn_get_opcode(struct insn *insn)
>  	insn_set_byte(opcode, 0, op);
>  	opcode->nbytes = 1;
>  
> -	/* Check if there is VEX prefix or not */
> -	if (insn_is_avx(insn)) {
> +	/* Check if there is VEX/XOP prefix or not */
> +	if (insn_is_avx_or_xop(insn)) {
>  		insn_byte_t m, p;
> +
> +		/* XOP prefix has different encoding */
> +		if (unlikely(avx_insn_is_xop(insn))) {
> +			m = insn_xop_map_bits(insn);
> +			insn->attr = inat_get_xop_attribute(op, m);
> +			if (!inat_accept_xop(insn->attr)) {
> +				insn->attr = 0;
> +				return -EINVAL;
> +			}
> +			/* XOP has only 1 byte for opcode */
> +			goto end;
> +		}
> +
>  		m = insn_vex_m_bits(insn);
>  		p = insn_vex_p_bits(insn);
>  		insn->attr = inat_get_avx_attribute(op, m, p);
> @@ -383,7 +399,8 @@ int insn_get_modrm(struct insn *insn)
>  			pfx_id = insn_last_prefix_id(insn);
>  			insn->attr = inat_get_group_attribute(mod, pfx_id,
>  							      insn->attr);
> -			if (insn_is_avx(insn) && !inat_accept_vex(insn->attr)) {
> +			if (insn_is_avx_or_xop(insn) && !inat_accept_vex(insn->attr) &&
> +			    !inat_accept_xop(insn->attr)) {
>  				/* Bad insn */
>  				insn->attr = 0;
>  				return -EINVAL;
> diff --git a/arch/x86/lib/x86-opcode-map.txt b/arch/x86/lib/x86-opcode-map.txt
> index 262f7ca1fb95..2a4e69ecc2de 100644
> --- a/arch/x86/lib/x86-opcode-map.txt
> +++ b/arch/x86/lib/x86-opcode-map.txt
> @@ -27,6 +27,11 @@
>  #  (evo): this opcode is changed by EVEX prefix (EVEX opcode)
>  #  (v): this opcode requires VEX prefix.
>  #  (v1): this opcode only supports 128bit VEX.
> +#  (xop): this opcode accepts XOP prefix.
> +#
> +# XOP Superscripts
> +#  (W=0): this opcode requires XOP.W == 0
> +#  (W=1): this opcode requires XOP.W == 1
>  #
>  # Last Prefix Superscripts
>  #  - (66): the last prefix is 0x66
> @@ -194,7 +199,7 @@ AVXcode:
>  8c: MOV Ev,Sw
>  8d: LEA Gv,M
>  8e: MOV Sw,Ew
> -8f: Grp1A (1A) | POP Ev (d64)
> +8f: Grp1A (1A) | POP Ev (d64) | XOP (Prefix)
>  # 0x90 - 0x9f
>  90: NOP | PAUSE (F3) | XCHG r8,rAX
>  91: XCHG rCX/r9,rAX
> @@ -1106,6 +1111,84 @@ AVXcode: 7
>  f8: URDMSR Rq,Id (F2),(v1),(11B) | UWRMSR Id,Rq (F3),(v1),(11B)
>  EndTable
>  
> +# From AMD64 Architecture Programmer's Manual Vol3, Appendix A.1.5
> +Table: XOP map 8h
> +Referrer:
> +XOPcode: 0
> +85: VPMACSSWW Vo,Ho,Wo,Lo
> +86: VPMACSSWD Vo,Ho,Wo,Lo
> +87: VPMACSSDQL Vo,Ho,Wo,Lo
> +8e: VPMACSSDD Vo,Ho,Wo,Lo
> +8f: VPMACSSDQH Vo,Ho,Wo,Lo
> +95: VPMACSWW Vo,Ho,Wo,Lo
> +96: VPMACSWD Vo,Ho,Wo,Lo
> +97: VPMACSDQL Vo,Ho,Wo,Lo
> +9e: VPMACSDD Vo,Ho,Wo,Lo
> +9f: VPMACSDQH Vo,Ho,Wo,Lo
> +a2: VPCMOV Vx,Hx,Wx,Lx (W=0) | VPCMOV Vx,Hx,Lx,Wx (W=1)
> +a3: VPPERM Vo,Ho,Wo,Lo (W=0) | VPPERM Vo,Ho,Lo,Wo (W=1)
> +a6: VPMADCSSWD Vo,Ho,Wo,Lo
> +b6: VPMADCSWD Vo,Ho,Wo,Lo
> +c0: VPROTB Vo,Wo,Ib
> +c1: VPROTW Vo,Wo,Ib
> +c2: VPROTD Vo,Wo,Ib
> +c3: VPROTQ Vo,Wo,Ib
> +cc: VPCOMccB Vo,Ho,Wo,Ib
> +cd: VPCOMccW Vo,Ho,Wo,Ib
> +ce: VPCOMccD Vo,Ho,Wo,Ib
> +cf: VPCOMccQ Vo,Ho,Wo,Ib
> +ec: VPCOMccUB Vo,Ho,Wo,Ib
> +ed: VPCOMccUW Vo,Ho,Wo,Ib
> +ee: VPCOMccUD Vo,Ho,Wo,Ib
> +ef: VPCOMccUQ Vo,Ho,Wo,Ib
> +EndTable
> +
> +Table: XOP map 9h
> +Referrer:
> +XOPcode: 1
> +01: GrpXOP1
> +02: GrpXOP2
> +12: GrpXOP3
> +80: VFRCZPS Vx,Wx
> +81: VFRCZPD Vx,Wx
> +82: VFRCZSS Vq,Wss
> +83: VFRCZSD Vq,Wsd
> +90: VPROTB Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +91: VPROTW Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +92: VPROTD Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +93: VPROTQ Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +94: VPSHLB Vo,Wo,Ho (W=0) | VPSHLB Vo,Ho,Wo (W=1)
> +95: VPSHLW Vo,Wo,Ho (W=0) | VPSHLW Vo,Ho,Wo (W=1)
> +96: VPSHLD Vo,Wo,Ho (W=0) | VPSHLD Vo,Ho,Wo (W=1)
> +97: VPSHLQ Vo,Wo,Ho (W=0) | VPSHLQ Vo,Ho,Wo (W=1)
> +98: VPSHAB Vo,Wo,Ho (W=0) | VPSHAB Vo,Ho,Wo (W=1)
> +99: VPSHAW Vo,Wo,Ho (W=0) | VPSHAW Vo,Ho,Wo (W=1)
> +9a: VPSHAD Vo,Wo,Ho (W=0) | VPSHAD Vo,Ho,Wo (W=1)
> +9b: VPSHAQ Vo,Wo,Ho (W=0) | VPSHAQ Vo,Ho,Wo (W=1)
> +c1: VPHADDBW Vo,Wo
> +c2: VPHADDBD Vo,Wo
> +c3: VPHADDBQ Vo,Wo
> +c6: VPHADDWD Vo,Wo
> +c7: VPHADDWQ Vo,Wo
> +cb: VPHADDDQ Vo,Wo
> +d1: VPHADDUBWD Vo,Wo
> +d2: VPHADDUBD Vo,Wo
> +d3: VPHADDUBQ Vo,Wo
> +d6: VPHADDUWD Vo,Wo
> +d7: VPHADDUWQ Vo,Wo
> +db: VPHADDUDQ Vo,Wo
> +e1: VPHSUBBW Vo,Wo
> +e2: VPHSUBWD Vo,Wo
> +e3: VPHSUBDQ Vo,Wo
> +EndTable
> +
> +Table: XOP map Ah
> +Referrer:
> +XOPcode: 2
> +10: BEXTR Gy,Ey,Id
> +12: GrpXOP4
> +EndTable
> +
>  GrpTable: Grp1
>  0: ADD
>  1: OR
> @@ -1320,3 +1403,29 @@ GrpTable: GrpRNG
>  4: xcrypt-cfb
>  5: xcrypt-ofb
>  EndTable
> +
> +# GrpXOP1-4 is shown in AMD APM Vol.3 Appendix A as XOP group #1-4
> +GrpTable: GrpXOP1
> +1: BLCFILL By,Ey (xop)
> +2: BLSFILL By,Ey (xop)
> +3: BLCS By,Ey (xop)
> +4: TZMSK By,Ey (xop)
> +5: BLCIC By,Ey (xop)
> +6: BLSIC By,Ey (xop)
> +7: T1MSKC By,Ey (xop)
> +EndTable
> +
> +GrpTable: GrpXOP2
> +1: BLCMSK By,Ey (xop)
> +6: BLCI By,Ey (xop)
> +EndTable
> +
> +GrpTable: GrpXOP3
> +0: LLWPCB Ry (xop)
> +1: SLWPCB Ry (xop)
> +EndTable
> +
> +GrpTable: GrpXOP4
> +0: LWPINS By,Ed,Id (xop)
> +1: LWPVAL By,Ed,Id (xop)
> +EndTable
> diff --git a/arch/x86/tools/gen-insn-attr-x86.awk b/arch/x86/tools/gen-insn-attr-x86.awk
> index 2c19d7fc8a85..7ea1b75e59b7 100644
> --- a/arch/x86/tools/gen-insn-attr-x86.awk
> +++ b/arch/x86/tools/gen-insn-attr-x86.awk
> @@ -21,6 +21,7 @@ function clear_vars() {
>  	eid = -1 # escape id
>  	gid = -1 # group id
>  	aid = -1 # AVX id
> +	xopid = -1 # XOP id
>  	tname = ""
>  }
>  
> @@ -39,9 +40,11 @@ BEGIN {
>  	ggid = 1
>  	geid = 1
>  	gaid = 0
> +	gxopid = 0
>  	delete etable
>  	delete gtable
>  	delete atable
> +	delete xoptable
>  
>  	opnd_expr = "^[A-Za-z/]"
>  	ext_expr = "^\\("
> @@ -61,6 +64,7 @@ BEGIN {
>  	imm_flag["Ob"] = "INAT_MOFFSET"
>  	imm_flag["Ov"] = "INAT_MOFFSET"
>  	imm_flag["Lx"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
> +	imm_flag["Lo"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
>  
>  	modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
>  	force64_expr = "\\([df]64\\)"
> @@ -87,6 +91,8 @@ BEGIN {
>  	evexonly_expr = "\\(ev\\)"
>  	# (es) is the same as (ev) but also "SCALABLE" i.e. W and pp determine operand size
>  	evex_scalable_expr = "\\(es\\)"
> +	# All opcodes in XOP table or with (xop) superscript accept XOP prefix
> +	xopok_expr = "\\(xop\\)"
>  
>  	prefix_expr = "\\(Prefix\\)"
>  	prefix_num["Operand-Size"] = "INAT_PFX_OPNDSZ"
> @@ -106,6 +112,7 @@ BEGIN {
>  	prefix_num["VEX+2byte"] = "INAT_PFX_VEX3"
>  	prefix_num["EVEX"] = "INAT_PFX_EVEX"
>  	prefix_num["REX2"] = "INAT_PFX_REX2"
> +	prefix_num["XOP"] = "INAT_PFX_XOP"
>  
>  	clear_vars()
>  }
> @@ -147,6 +154,7 @@ function array_size(arr,   i,c) {
>  	if (NF != 1) {
>  		# AVX/escape opcode table
>  		aid = $2
> +		xopid = -1
>  		if (gaid <= aid)
>  			gaid = aid + 1
>  		if (tname == "")	# AVX only opcode table
> @@ -156,6 +164,20 @@ function array_size(arr,   i,c) {
>  		tname = "inat_primary_table"
>  }
>  
> +/^XOPcode:/ {
> +	if (NF != 1) {
> +		# XOP opcode table
> +		xopid = $2
> +		aid = -1
> +		if (gxopid <= xopid)
> +			gxopid = xopid + 1
> +		if (tname == "")	# XOP only opcode table
> +			tname = sprintf("inat_xop_table_%d", $2)
> +	}
> +	if (xopid == -1 && eid == -1)	# primary opcode table
> +		tname = "inat_primary_table"
> +}
> +
>  /^GrpTable:/ {
>  	print "/* " $0 " */"
>  	if (!($2 in group))
> @@ -206,6 +228,8 @@ function print_table(tbl,name,fmt,n)
>  			etable[eid,0] = tname
>  			if (aid >= 0)
>  				atable[aid,0] = tname
> +			else if (xopid >= 0)
> +				xoptable[xopid] = tname
>  		}
>  		if (array_size(lptable1) != 0) {
>  			print_table(lptable1,tname "_1[INAT_OPCODE_TABLE_SIZE]",
> @@ -347,6 +371,8 @@ function convert_operands(count,opnd,       i,j,imm,mod)
>  			flags = add_flags(flags, "INAT_VEXOK | INAT_VEXONLY")
>  		else if (match(ext, vexok_expr) || match(opcode, vexok_opcode_expr))
>  			flags = add_flags(flags, "INAT_VEXOK")
> +		else if (match(ext, xopok_expr) || xopid >= 0)
> +			flags = add_flags(flags, "INAT_XOPOK")
>  
>  		# check prefixes
>  		if (match(ext, prefix_expr)) {
> @@ -413,6 +439,14 @@ END {
>  				print "	["i"]["j"] = "atable[i,j]","
>  	print "};\n"
>  
> +	print "/* XOP opcode map array */"
> +	print "const insn_attr_t * const inat_xop_tables[X86_XOP_M_MAX - X86_XOP_M_MIN + 1]" \
> +	      " = {"
> +	for (i = 0; i < gxopid; i++)
> +		if (xoptable[i])
> +			print "	["i"] = "xoptable[i]","
> +	print "};"
> +
>  	print "#else /* !__BOOT_COMPRESSED */\n"
>  
>  	print "/* Escape opcode map array */"
> @@ -430,6 +464,10 @@ END {
>  	      "[INAT_LSTPFX_MAX + 1];"
>  	print ""
>  
> +	print "/* XOP opcode map array */"
> +	print "static const insn_attr_t *inat_xop_tables[X86_XOP_M_MAX - X86_XOP_M_MIN + 1];"
> +	print ""
> +
>  	print "static void inat_init_tables(void)"
>  	print "{"
>  
> @@ -455,6 +493,12 @@ END {
>  			if (atable[i,j])
>  				print "\tinat_avx_tables["i"]["j"] = "atable[i,j]";"
>  
> +	print ""
> +	print "\t/* Print XOP opcode map array */"
> +	for (i = 0; i < gxopid; i++)
> +		if (xoptable[i])
> +			print "\tinat_xop_tables["i"] = "xoptable[i]";"
> +
>  	print "}"
>  	print "#endif"
>  }
> diff --git a/tools/arch/x86/include/asm/inat.h b/tools/arch/x86/include/asm/inat.h
> index 183aa662b165..099e926595bd 100644
> --- a/tools/arch/x86/include/asm/inat.h
> +++ b/tools/arch/x86/include/asm/inat.h
> @@ -37,6 +37,8 @@
>  #define INAT_PFX_EVEX	15	/* EVEX prefix */
>  /* x86-64 REX2 prefix */
>  #define INAT_PFX_REX2	16	/* 0xD5 */
> +/* AMD XOP prefix */
> +#define INAT_PFX_XOP	17	/* 0x8F */
>  
>  #define INAT_LSTPFX_MAX	3
>  #define INAT_LGCPFX_MAX	11
> @@ -77,6 +79,7 @@
>  #define INAT_MOFFSET	(1 << (INAT_FLAG_OFFS + 3))
>  #define INAT_VARIANT	(1 << (INAT_FLAG_OFFS + 4))
>  #define INAT_VEXOK	(1 << (INAT_FLAG_OFFS + 5))
> +#define INAT_XOPOK	INAT_VEXOK
>  #define INAT_VEXONLY	(1 << (INAT_FLAG_OFFS + 6))
>  #define INAT_EVEXONLY	(1 << (INAT_FLAG_OFFS + 7))
>  #define INAT_NO_REX2	(1 << (INAT_FLAG_OFFS + 8))
> @@ -111,6 +114,8 @@ extern insn_attr_t inat_get_group_attribute(insn_byte_t modrm,
>  extern insn_attr_t inat_get_avx_attribute(insn_byte_t opcode,
>  					  insn_byte_t vex_m,
>  					  insn_byte_t vex_pp);
> +extern insn_attr_t inat_get_xop_attribute(insn_byte_t opcode,
> +					  insn_byte_t map_select);
>  
>  /* Attribute checking functions */
>  static inline int inat_is_legacy_prefix(insn_attr_t attr)
> @@ -164,6 +169,11 @@ static inline int inat_is_vex3_prefix(insn_attr_t attr)
>  	return (attr & INAT_PFX_MASK) == INAT_PFX_VEX3;
>  }
>  
> +static inline int inat_is_xop_prefix(insn_attr_t attr)
> +{
> +	return (attr & INAT_PFX_MASK) == INAT_PFX_XOP;
> +}
> +
>  static inline int inat_is_escape(insn_attr_t attr)
>  {
>  	return attr & INAT_ESC_MASK;
> @@ -229,6 +239,11 @@ static inline int inat_accept_vex(insn_attr_t attr)
>  	return attr & INAT_VEXOK;
>  }
>  
> +static inline int inat_accept_xop(insn_attr_t attr)
> +{
> +	return attr & INAT_XOPOK;
> +}
> +
>  static inline int inat_must_vex(insn_attr_t attr)
>  {
>  	return attr & (INAT_VEXONLY | INAT_EVEXONLY);
> diff --git a/tools/arch/x86/include/asm/insn.h b/tools/arch/x86/include/asm/insn.h
> index 0e5abd896ad4..c683d609934b 100644
> --- a/tools/arch/x86/include/asm/insn.h
> +++ b/tools/arch/x86/include/asm/insn.h
> @@ -71,7 +71,10 @@ struct insn {
>  					 * prefixes.bytes[3]: last prefix
>  					 */
>  	struct insn_field rex_prefix;	/* REX prefix */
> -	struct insn_field vex_prefix;	/* VEX prefix */
> +	union {
> +		struct insn_field vex_prefix;	/* VEX prefix */
> +		struct insn_field xop_prefix;	/* XOP prefix */
> +	};
>  	struct insn_field opcode;	/*
>  					 * opcode.bytes[0]: opcode1
>  					 * opcode.bytes[1]: opcode2
> @@ -135,6 +138,17 @@ struct insn {
>  #define X86_VEX_V(vex)	(((vex) & 0x78) >> 3)	/* VEX3 Byte2, VEX2 Byte1 */
>  #define X86_VEX_P(vex)	((vex) & 0x03)		/* VEX3 Byte2, VEX2 Byte1 */
>  #define X86_VEX_M_MAX	0x1f			/* VEX3.M Maximum value */
> +/* XOP bit fields */
> +#define X86_XOP_R(xop)	((xop) & 0x80)	/* XOP Byte2 */
> +#define X86_XOP_X(xop)	((xop) & 0x40)	/* XOP Byte2 */
> +#define X86_XOP_B(xop)	((xop) & 0x20)	/* XOP Byte2 */
> +#define X86_XOP_M(xop)	((xop) & 0x1f)	/* XOP Byte2 */
> +#define X86_XOP_W(xop)	((xop) & 0x80)	/* XOP Byte3 */
> +#define X86_XOP_V(xop)	((xop) & 0x78)	/* XOP Byte3 */
> +#define X86_XOP_L(xop)	((xop) & 0x04)	/* XOP Byte3 */
> +#define X86_XOP_P(xop)	((xop) & 0x03)	/* XOP Byte3 */
> +#define X86_XOP_M_MIN	0x08	/* Min of XOP.M */
> +#define X86_XOP_M_MAX	0x1f	/* Max of XOP.M */
>  
>  extern void insn_init(struct insn *insn, const void *kaddr, int buf_len, int x86_64);
>  extern int insn_get_prefixes(struct insn *insn);
> @@ -178,7 +192,7 @@ static inline insn_byte_t insn_rex2_m_bit(struct insn *insn)
>  	return X86_REX2_M(insn->rex_prefix.bytes[1]);
>  }
>  
> -static inline int insn_is_avx(struct insn *insn)
> +static inline int insn_is_avx_or_xop(struct insn *insn)
>  {
>  	if (!insn->prefixes.got)
>  		insn_get_prefixes(insn);
> @@ -192,6 +206,22 @@ static inline int insn_is_evex(struct insn *insn)
>  	return (insn->vex_prefix.nbytes == 4);
>  }
>  
> +/* If we already know this is AVX/XOP encoded */
> +static inline int avx_insn_is_xop(struct insn *insn)
> +{
> +	insn_attr_t attr = inat_get_opcode_attribute(insn->vex_prefix.bytes[0]);
> +
> +	return inat_is_xop_prefix(attr);
> +}
> +
> +static inline int insn_is_xop(struct insn *insn)
> +{
> +	if (!insn_is_avx_or_xop(insn))
> +		return 0;
> +
> +	return avx_insn_is_xop(insn);
> +}
> +
>  static inline int insn_has_emulate_prefix(struct insn *insn)
>  {
>  	return !!insn->emulate_prefix_size;
> @@ -222,11 +252,26 @@ static inline insn_byte_t insn_vex_w_bit(struct insn *insn)
>  	return X86_VEX_W(insn->vex_prefix.bytes[2]);
>  }
>  
> +static inline insn_byte_t insn_xop_map_bits(struct insn *insn)
> +{
> +	if (insn->xop_prefix.nbytes < 3)	/* XOP is 3 bytes */
> +		return 0;
> +	return X86_XOP_M(insn->xop_prefix.bytes[1]);
> +}
> +
> +static inline insn_byte_t insn_xop_p_bits(struct insn *insn)
> +{
> +	return X86_XOP_P(insn->vex_prefix.bytes[2]);
> +}
> +
>  /* Get the last prefix id from last prefix or VEX prefix */
>  static inline int insn_last_prefix_id(struct insn *insn)
>  {
> -	if (insn_is_avx(insn))
> +	if (insn_is_avx_or_xop(insn)) {
> +		if (avx_insn_is_xop(insn))
> +			return insn_xop_p_bits(insn);
>  		return insn_vex_p_bits(insn);	/* VEX_p is a SIMD prefix id */
> +	}
>  
>  	if (insn->prefixes.bytes[3])
>  		return inat_get_last_prefix_id(insn->prefixes.bytes[3]);
> diff --git a/tools/arch/x86/lib/inat.c b/tools/arch/x86/lib/inat.c
> index dfbcc6405941..ffcb0e27453b 100644
> --- a/tools/arch/x86/lib/inat.c
> +++ b/tools/arch/x86/lib/inat.c
> @@ -81,3 +81,16 @@ insn_attr_t inat_get_avx_attribute(insn_byte_t opcode, insn_byte_t vex_m,
>  	return table[opcode];
>  }
>  
> +insn_attr_t inat_get_xop_attribute(insn_byte_t opcode, insn_byte_t map_select)
> +{
> +	const insn_attr_t *table;
> +
> +	if (map_select < X86_XOP_M_MIN || map_select > X86_XOP_M_MAX)
> +		return 0;
> +	map_select -= X86_XOP_M_MIN;
> +	/* At first, this checks the master table */
> +	table = inat_xop_tables[map_select];
> +	if (!table)
> +		return 0;
> +	return table[opcode];
> +}
> diff --git a/tools/arch/x86/lib/insn.c b/tools/arch/x86/lib/insn.c
> index bce69c6bfa69..1d1c57c74d1f 100644
> --- a/tools/arch/x86/lib/insn.c
> +++ b/tools/arch/x86/lib/insn.c
> @@ -200,12 +200,15 @@ int insn_get_prefixes(struct insn *insn)
>  	}
>  	insn->rex_prefix.got = 1;
>  
> -	/* Decode VEX prefix */
> +	/* Decode VEX/XOP prefix */
>  	b = peek_next(insn_byte_t, insn);
> -	attr = inat_get_opcode_attribute(b);
> -	if (inat_is_vex_prefix(attr)) {
> +	if (inat_is_vex_prefix(attr) || inat_is_xop_prefix(attr)) {
>  		insn_byte_t b2 = peek_nbyte_next(insn_byte_t, insn, 1);
> -		if (!insn->x86_64) {
> +
> +		if (inat_is_xop_prefix(attr) && X86_MODRM_REG(b2) == 0) {
> +			/* Grp1A.0 is always POP Ev */
> +			goto vex_end;
> +		} else if (!insn->x86_64) {
>  			/*
>  			 * In 32-bits mode, if the [7:6] bits (mod bits of
>  			 * ModRM) on the second byte are not 11b, it is
> @@ -226,13 +229,13 @@ int insn_get_prefixes(struct insn *insn)
>  			if (insn->x86_64 && X86_VEX_W(b2))
>  				/* VEX.W overrides opnd_size */
>  				insn->opnd_bytes = 8;
> -		} else if (inat_is_vex3_prefix(attr)) {
> +		} else if (inat_is_vex3_prefix(attr) || inat_is_xop_prefix(attr)) {
>  			b2 = peek_nbyte_next(insn_byte_t, insn, 2);
>  			insn_set_byte(&insn->vex_prefix, 2, b2);
>  			insn->vex_prefix.nbytes = 3;
>  			insn->next_byte += 3;
>  			if (insn->x86_64 && X86_VEX_W(b2))
> -				/* VEX.W overrides opnd_size */
> +				/* VEX.W/XOP.W overrides opnd_size */
>  				insn->opnd_bytes = 8;
>  		} else {
>  			/*
> @@ -288,9 +291,22 @@ int insn_get_opcode(struct insn *insn)
>  	insn_set_byte(opcode, 0, op);
>  	opcode->nbytes = 1;
>  
> -	/* Check if there is VEX prefix or not */
> -	if (insn_is_avx(insn)) {
> +	/* Check if there is VEX/XOP prefix or not */
> +	if (insn_is_avx_or_xop(insn)) {
>  		insn_byte_t m, p;
> +
> +		/* XOP prefix has different encoding */
> +		if (unlikely(avx_insn_is_xop(insn))) {
> +			m = insn_xop_map_bits(insn);
> +			insn->attr = inat_get_xop_attribute(op, m);
> +			if (!inat_accept_xop(insn->attr)) {
> +				insn->attr = 0;
> +				return -EINVAL;
> +			}
> +			/* XOP has only 1 byte for opcode */
> +			goto end;
> +		}
> +
>  		m = insn_vex_m_bits(insn);
>  		p = insn_vex_p_bits(insn);
>  		insn->attr = inat_get_avx_attribute(op, m, p);
> @@ -383,7 +399,8 @@ int insn_get_modrm(struct insn *insn)
>  			pfx_id = insn_last_prefix_id(insn);
>  			insn->attr = inat_get_group_attribute(mod, pfx_id,
>  							      insn->attr);
> -			if (insn_is_avx(insn) && !inat_accept_vex(insn->attr)) {
> +			if (insn_is_avx_or_xop(insn) && !inat_accept_vex(insn->attr) &&
> +			    !inat_accept_xop(insn->attr)) {
>  				/* Bad insn */
>  				insn->attr = 0;
>  				return -EINVAL;
> diff --git a/tools/arch/x86/lib/x86-opcode-map.txt b/tools/arch/x86/lib/x86-opcode-map.txt
> index 262f7ca1fb95..2a4e69ecc2de 100644
> --- a/tools/arch/x86/lib/x86-opcode-map.txt
> +++ b/tools/arch/x86/lib/x86-opcode-map.txt
> @@ -27,6 +27,11 @@
>  #  (evo): this opcode is changed by EVEX prefix (EVEX opcode)
>  #  (v): this opcode requires VEX prefix.
>  #  (v1): this opcode only supports 128bit VEX.
> +#  (xop): this opcode accepts XOP prefix.
> +#
> +# XOP Superscripts
> +#  (W=0): this opcode requires XOP.W == 0
> +#  (W=1): this opcode requires XOP.W == 1
>  #
>  # Last Prefix Superscripts
>  #  - (66): the last prefix is 0x66
> @@ -194,7 +199,7 @@ AVXcode:
>  8c: MOV Ev,Sw
>  8d: LEA Gv,M
>  8e: MOV Sw,Ew
> -8f: Grp1A (1A) | POP Ev (d64)
> +8f: Grp1A (1A) | POP Ev (d64) | XOP (Prefix)
>  # 0x90 - 0x9f
>  90: NOP | PAUSE (F3) | XCHG r8,rAX
>  91: XCHG rCX/r9,rAX
> @@ -1106,6 +1111,84 @@ AVXcode: 7
>  f8: URDMSR Rq,Id (F2),(v1),(11B) | UWRMSR Id,Rq (F3),(v1),(11B)
>  EndTable
>  
> +# From AMD64 Architecture Programmer's Manual Vol3, Appendix A.1.5
> +Table: XOP map 8h
> +Referrer:
> +XOPcode: 0
> +85: VPMACSSWW Vo,Ho,Wo,Lo
> +86: VPMACSSWD Vo,Ho,Wo,Lo
> +87: VPMACSSDQL Vo,Ho,Wo,Lo
> +8e: VPMACSSDD Vo,Ho,Wo,Lo
> +8f: VPMACSSDQH Vo,Ho,Wo,Lo
> +95: VPMACSWW Vo,Ho,Wo,Lo
> +96: VPMACSWD Vo,Ho,Wo,Lo
> +97: VPMACSDQL Vo,Ho,Wo,Lo
> +9e: VPMACSDD Vo,Ho,Wo,Lo
> +9f: VPMACSDQH Vo,Ho,Wo,Lo
> +a2: VPCMOV Vx,Hx,Wx,Lx (W=0) | VPCMOV Vx,Hx,Lx,Wx (W=1)
> +a3: VPPERM Vo,Ho,Wo,Lo (W=0) | VPPERM Vo,Ho,Lo,Wo (W=1)
> +a6: VPMADCSSWD Vo,Ho,Wo,Lo
> +b6: VPMADCSWD Vo,Ho,Wo,Lo
> +c0: VPROTB Vo,Wo,Ib
> +c1: VPROTW Vo,Wo,Ib
> +c2: VPROTD Vo,Wo,Ib
> +c3: VPROTQ Vo,Wo,Ib
> +cc: VPCOMccB Vo,Ho,Wo,Ib
> +cd: VPCOMccW Vo,Ho,Wo,Ib
> +ce: VPCOMccD Vo,Ho,Wo,Ib
> +cf: VPCOMccQ Vo,Ho,Wo,Ib
> +ec: VPCOMccUB Vo,Ho,Wo,Ib
> +ed: VPCOMccUW Vo,Ho,Wo,Ib
> +ee: VPCOMccUD Vo,Ho,Wo,Ib
> +ef: VPCOMccUQ Vo,Ho,Wo,Ib
> +EndTable
> +
> +Table: XOP map 9h
> +Referrer:
> +XOPcode: 1
> +01: GrpXOP1
> +02: GrpXOP2
> +12: GrpXOP3
> +80: VFRCZPS Vx,Wx
> +81: VFRCZPD Vx,Wx
> +82: VFRCZSS Vq,Wss
> +83: VFRCZSD Vq,Wsd
> +90: VPROTB Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +91: VPROTW Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +92: VPROTD Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +93: VPROTQ Vo,Wo,Ho (W=0) | VPROTB Vo,Ho,Wo (W=1)
> +94: VPSHLB Vo,Wo,Ho (W=0) | VPSHLB Vo,Ho,Wo (W=1)
> +95: VPSHLW Vo,Wo,Ho (W=0) | VPSHLW Vo,Ho,Wo (W=1)
> +96: VPSHLD Vo,Wo,Ho (W=0) | VPSHLD Vo,Ho,Wo (W=1)
> +97: VPSHLQ Vo,Wo,Ho (W=0) | VPSHLQ Vo,Ho,Wo (W=1)
> +98: VPSHAB Vo,Wo,Ho (W=0) | VPSHAB Vo,Ho,Wo (W=1)
> +99: VPSHAW Vo,Wo,Ho (W=0) | VPSHAW Vo,Ho,Wo (W=1)
> +9a: VPSHAD Vo,Wo,Ho (W=0) | VPSHAD Vo,Ho,Wo (W=1)
> +9b: VPSHAQ Vo,Wo,Ho (W=0) | VPSHAQ Vo,Ho,Wo (W=1)
> +c1: VPHADDBW Vo,Wo
> +c2: VPHADDBD Vo,Wo
> +c3: VPHADDBQ Vo,Wo
> +c6: VPHADDWD Vo,Wo
> +c7: VPHADDWQ Vo,Wo
> +cb: VPHADDDQ Vo,Wo
> +d1: VPHADDUBWD Vo,Wo
> +d2: VPHADDUBD Vo,Wo
> +d3: VPHADDUBQ Vo,Wo
> +d6: VPHADDUWD Vo,Wo
> +d7: VPHADDUWQ Vo,Wo
> +db: VPHADDUDQ Vo,Wo
> +e1: VPHSUBBW Vo,Wo
> +e2: VPHSUBWD Vo,Wo
> +e3: VPHSUBDQ Vo,Wo
> +EndTable
> +
> +Table: XOP map Ah
> +Referrer:
> +XOPcode: 2
> +10: BEXTR Gy,Ey,Id
> +12: GrpXOP4
> +EndTable
> +
>  GrpTable: Grp1
>  0: ADD
>  1: OR
> @@ -1320,3 +1403,29 @@ GrpTable: GrpRNG
>  4: xcrypt-cfb
>  5: xcrypt-ofb
>  EndTable
> +
> +# GrpXOP1-4 is shown in AMD APM Vol.3 Appendix A as XOP group #1-4
> +GrpTable: GrpXOP1
> +1: BLCFILL By,Ey (xop)
> +2: BLSFILL By,Ey (xop)
> +3: BLCS By,Ey (xop)
> +4: TZMSK By,Ey (xop)
> +5: BLCIC By,Ey (xop)
> +6: BLSIC By,Ey (xop)
> +7: T1MSKC By,Ey (xop)
> +EndTable
> +
> +GrpTable: GrpXOP2
> +1: BLCMSK By,Ey (xop)
> +6: BLCI By,Ey (xop)
> +EndTable
> +
> +GrpTable: GrpXOP3
> +0: LLWPCB Ry (xop)
> +1: SLWPCB Ry (xop)
> +EndTable
> +
> +GrpTable: GrpXOP4
> +0: LWPINS By,Ed,Id (xop)
> +1: LWPVAL By,Ed,Id (xop)
> +EndTable
> diff --git a/tools/arch/x86/tools/gen-insn-attr-x86.awk b/tools/arch/x86/tools/gen-insn-attr-x86.awk
> index 2c19d7fc8a85..7ea1b75e59b7 100644
> --- a/tools/arch/x86/tools/gen-insn-attr-x86.awk
> +++ b/tools/arch/x86/tools/gen-insn-attr-x86.awk
> @@ -21,6 +21,7 @@ function clear_vars() {
>  	eid = -1 # escape id
>  	gid = -1 # group id
>  	aid = -1 # AVX id
> +	xopid = -1 # XOP id
>  	tname = ""
>  }
>  
> @@ -39,9 +40,11 @@ BEGIN {
>  	ggid = 1
>  	geid = 1
>  	gaid = 0
> +	gxopid = 0
>  	delete etable
>  	delete gtable
>  	delete atable
> +	delete xoptable
>  
>  	opnd_expr = "^[A-Za-z/]"
>  	ext_expr = "^\\("
> @@ -61,6 +64,7 @@ BEGIN {
>  	imm_flag["Ob"] = "INAT_MOFFSET"
>  	imm_flag["Ov"] = "INAT_MOFFSET"
>  	imm_flag["Lx"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
> +	imm_flag["Lo"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
>  
>  	modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
>  	force64_expr = "\\([df]64\\)"
> @@ -87,6 +91,8 @@ BEGIN {
>  	evexonly_expr = "\\(ev\\)"
>  	# (es) is the same as (ev) but also "SCALABLE" i.e. W and pp determine operand size
>  	evex_scalable_expr = "\\(es\\)"
> +	# All opcodes in XOP table or with (xop) superscript accept XOP prefix
> +	xopok_expr = "\\(xop\\)"
>  
>  	prefix_expr = "\\(Prefix\\)"
>  	prefix_num["Operand-Size"] = "INAT_PFX_OPNDSZ"
> @@ -106,6 +112,7 @@ BEGIN {
>  	prefix_num["VEX+2byte"] = "INAT_PFX_VEX3"
>  	prefix_num["EVEX"] = "INAT_PFX_EVEX"
>  	prefix_num["REX2"] = "INAT_PFX_REX2"
> +	prefix_num["XOP"] = "INAT_PFX_XOP"
>  
>  	clear_vars()
>  }
> @@ -147,6 +154,7 @@ function array_size(arr,   i,c) {
>  	if (NF != 1) {
>  		# AVX/escape opcode table
>  		aid = $2
> +		xopid = -1
>  		if (gaid <= aid)
>  			gaid = aid + 1
>  		if (tname == "")	# AVX only opcode table
> @@ -156,6 +164,20 @@ function array_size(arr,   i,c) {
>  		tname = "inat_primary_table"
>  }
>  
> +/^XOPcode:/ {
> +	if (NF != 1) {
> +		# XOP opcode table
> +		xopid = $2
> +		aid = -1
> +		if (gxopid <= xopid)
> +			gxopid = xopid + 1
> +		if (tname == "")	# XOP only opcode table
> +			tname = sprintf("inat_xop_table_%d", $2)
> +	}
> +	if (xopid == -1 && eid == -1)	# primary opcode table
> +		tname = "inat_primary_table"
> +}
> +
>  /^GrpTable:/ {
>  	print "/* " $0 " */"
>  	if (!($2 in group))
> @@ -206,6 +228,8 @@ function print_table(tbl,name,fmt,n)
>  			etable[eid,0] = tname
>  			if (aid >= 0)
>  				atable[aid,0] = tname
> +			else if (xopid >= 0)
> +				xoptable[xopid] = tname
>  		}
>  		if (array_size(lptable1) != 0) {
>  			print_table(lptable1,tname "_1[INAT_OPCODE_TABLE_SIZE]",
> @@ -347,6 +371,8 @@ function convert_operands(count,opnd,       i,j,imm,mod)
>  			flags = add_flags(flags, "INAT_VEXOK | INAT_VEXONLY")
>  		else if (match(ext, vexok_expr) || match(opcode, vexok_opcode_expr))
>  			flags = add_flags(flags, "INAT_VEXOK")
> +		else if (match(ext, xopok_expr) || xopid >= 0)
> +			flags = add_flags(flags, "INAT_XOPOK")
>  
>  		# check prefixes
>  		if (match(ext, prefix_expr)) {
> @@ -413,6 +439,14 @@ END {
>  				print "	["i"]["j"] = "atable[i,j]","
>  	print "};\n"
>  
> +	print "/* XOP opcode map array */"
> +	print "const insn_attr_t * const inat_xop_tables[X86_XOP_M_MAX - X86_XOP_M_MIN + 1]" \
> +	      " = {"
> +	for (i = 0; i < gxopid; i++)
> +		if (xoptable[i])
> +			print "	["i"] = "xoptable[i]","
> +	print "};"
> +
>  	print "#else /* !__BOOT_COMPRESSED */\n"
>  
>  	print "/* Escape opcode map array */"
> @@ -430,6 +464,10 @@ END {
>  	      "[INAT_LSTPFX_MAX + 1];"
>  	print ""
>  
> +	print "/* XOP opcode map array */"
> +	print "static const insn_attr_t *inat_xop_tables[X86_XOP_M_MAX - X86_XOP_M_MIN + 1];"
> +	print ""
> +
>  	print "static void inat_init_tables(void)"
>  	print "{"
>  
> @@ -455,6 +493,12 @@ END {
>  			if (atable[i,j])
>  				print "\tinat_avx_tables["i"]["j"] = "atable[i,j]";"
>  
> +	print ""
> +	print "\t/* Print XOP opcode map array */"
> +	for (i = 0; i < gxopid; i++)
> +		if (xoptable[i])
> +			print "\tinat_xop_tables["i"] = "xoptable[i]";"
> +
>  	print "}"
>  	print "#endif"
>  }
> diff --git a/tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.c b/tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.c
> index 8fabddc1c0da..72c7a4e15d61 100644
> --- a/tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.c
> +++ b/tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.c
> @@ -32,7 +32,7 @@ static void intel_pt_insn_decoder(struct insn *insn,
>  	intel_pt_insn->rel = 0;
>  	intel_pt_insn->emulated_ptwrite = false;
>  
> -	if (insn_is_avx(insn)) {
> +	if (insn_is_avx_or_xop(insn)) {
>  		intel_pt_insn->op = INTEL_PT_OP_OTHER;
>  		intel_pt_insn->branch = INTEL_PT_BR_NO_BRANCH;
>  		intel_pt_insn->length = insn->length;
> 


-- 
Masami Hiramatsu (Google) <mhiramat@...nel.org>