[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-ID: <20250429085005.GE4198@noisy.programming.kicks-ass.net>
Date: Tue, 29 Apr 2025 10:50:05 +0200
From: Peter Zijlstra <peterz@...radead.org>
To: "Masami Hiramatsu (Google)" <mhiramat@...nel.org>
Cc: Ingo Molnar <mingo@...hat.com>, Thomas Gleixner <tglx@...utronix.de>,
Borislav Petkov <bp@...en8.de>,
Dave Hansen <dave.hansen@...ux.intel.com>, x86@...nel.org,
"H . Peter Anvin" <hpa@...or.com>, linux-kernel@...r.kernel.org,
Adrian Hunter <adrian.hunter@...el.com>
Subject: Re: [PATCH 2/2] x86: Stop decoding i64 instructions in x86-64 mode
at opcode
On Mon, Apr 28, 2025 at 10:48:20AM +0900, Masami Hiramatsu (Google) wrote:
> From: Masami Hiramatsu (Google) <mhiramat@...nel.org>
>
> In commit 2e044911be75 ("x86/traps: Decode 0xEA instructions as #UD")
> FineIBT starts using 0xEA as an invalid instruction like UD2. But
> insn decoder always returns the length of "0xea" instruction is 7
> because it does not check (i64) superscript.
> The x86 instruction decoder should also decode 0xEA on x86-64 as
> one-byte invalid instruction by decoding "(i64)" superscript tag.
>
> This stops decoding instruction which has (i64) but not have (o64)
> superscript in 64bit mode at opcode and skip other fields.
>
> With this change, insn_decoder_test says 0xea is 1 byte length if
> x86-64 (-y option means 64bit).
> -----
> > printf "0:\tea\t\n" | insn_decoder_test -y -v
> insn_decoder_test: success: Decoded and checked 1 instructions
> -----
Notably matching objdump's decode behaviour in this case.
Thanks!
Reported-by: Peter Zijlstra (Intel) <peterz@...radead.org>
Tested-by: Peter Zijlstra (Intel) <peterz@...radead.org>
>
> Signed-off-by: Masami Hiramatsu (Google) <mhiramat@...nel.org>
> ---
> arch/x86/include/asm/inat.h | 6 ++++++
> arch/x86/lib/insn.c | 7 ++++++-
> arch/x86/lib/x86-opcode-map.txt | 6 +++---
> arch/x86/tools/gen-insn-attr-x86.awk | 7 +++++++
> tools/arch/x86/include/asm/inat.h | 6 ++++++
> tools/arch/x86/lib/insn.c | 7 ++++++-
> tools/arch/x86/lib/x86-opcode-map.txt | 6 +++---
> tools/arch/x86/tools/gen-insn-attr-x86.awk | 7 +++++++
> 8 files changed, 44 insertions(+), 8 deletions(-)
>
> diff --git a/arch/x86/include/asm/inat.h b/arch/x86/include/asm/inat.h
> index 53e4015242b4..97f341777db5 100644
> --- a/arch/x86/include/asm/inat.h
> +++ b/arch/x86/include/asm/inat.h
> @@ -82,6 +82,7 @@
> #define INAT_NO_REX2 (1 << (INAT_FLAG_OFFS + 8))
> #define INAT_REX2_VARIANT (1 << (INAT_FLAG_OFFS + 9))
> #define INAT_EVEX_SCALABLE (1 << (INAT_FLAG_OFFS + 10))
> +#define INAT_INV64 (1 << (INAT_FLAG_OFFS + 11))
> /* Attribute making macros for attribute tables */
> #define INAT_MAKE_PREFIX(pfx) (pfx << INAT_PFX_OFFS)
> #define INAT_MAKE_ESCAPE(esc) (esc << INAT_ESC_OFFS)
> @@ -242,4 +243,9 @@ static inline int inat_evex_scalable(insn_attr_t attr)
> {
> return attr & INAT_EVEX_SCALABLE;
> }
> +
> +static inline int inat_is_invalid64(insn_attr_t attr)
> +{
> + return attr & INAT_INV64;
> +}
> #endif
> diff --git a/arch/x86/lib/insn.c b/arch/x86/lib/insn.c
> index 6ffb931b9fb1..149a57e334ab 100644
> --- a/arch/x86/lib/insn.c
> +++ b/arch/x86/lib/insn.c
> @@ -324,6 +324,11 @@ int insn_get_opcode(struct insn *insn)
> }
>
> insn->attr = inat_get_opcode_attribute(op);
> + if (insn->x86_64 && inat_is_invalid64(insn->attr)) {
> + /* This instruction is invalid, like UD2. Stop decoding. */
> + insn->attr &= INAT_INV64;
> + }
> +
> while (inat_is_escape(insn->attr)) {
> /* Get escaped opcode */
> op = get_next(insn_byte_t, insn);
> @@ -337,6 +342,7 @@ int insn_get_opcode(struct insn *insn)
> insn->attr = 0;
> return -EINVAL;
> }
> +
> end:
> opcode->got = 1;
> return 0;
> @@ -658,7 +664,6 @@ int insn_get_immediate(struct insn *insn)
> }
>
> if (!inat_has_immediate(insn->attr))
> - /* no immediates */
> goto done;
>
> switch (inat_immediate_size(insn->attr)) {
> diff --git a/arch/x86/lib/x86-opcode-map.txt b/arch/x86/lib/x86-opcode-map.txt
> index 5e2fa3f7128e..de0be0462190 100644
> --- a/arch/x86/lib/x86-opcode-map.txt
> +++ b/arch/x86/lib/x86-opcode-map.txt
> @@ -147,7 +147,7 @@ AVXcode:
> # 0x60 - 0x6f
> 60: PUSHA/PUSHAD (i64)
> 61: POPA/POPAD (i64)
> -62: BOUND Gv,Ma (i64) | EVEX (Prefix)
> +62: BOUND Gv,Ma (i64) | EVEX (Prefix),(o64)
> 63: ARPL Ew,Gw (i64) | MOVSXD Gv,Ev (o64)
> 64: SEG=FS (Prefix)
> 65: SEG=GS (Prefix)
> @@ -253,8 +253,8 @@ c0: Grp2 Eb,Ib (1A)
> c1: Grp2 Ev,Ib (1A)
> c2: RETN Iw (f64)
> c3: RETN
> -c4: LES Gz,Mp (i64) | VEX+2byte (Prefix)
> -c5: LDS Gz,Mp (i64) | VEX+1byte (Prefix)
> +c4: LES Gz,Mp (i64) | VEX+2byte (Prefix),(o64)
> +c5: LDS Gz,Mp (i64) | VEX+1byte (Prefix),(o64)
> c6: Grp11A Eb,Ib (1A)
> c7: Grp11B Ev,Iz (1A)
> c8: ENTER Iw,Ib
> diff --git a/arch/x86/tools/gen-insn-attr-x86.awk b/arch/x86/tools/gen-insn-attr-x86.awk
> index 5770c8097f32..29e939893082 100644
> --- a/arch/x86/tools/gen-insn-attr-x86.awk
> +++ b/arch/x86/tools/gen-insn-attr-x86.awk
> @@ -64,6 +64,8 @@ BEGIN {
>
> modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
> force64_expr = "\\([df]64\\)"
> + invalid64_expr = "\\(i64\\)"
> + only64_expr = "\\(o64\\)"
> rex_expr = "^((REX(\\.[XRWB]+)+)|(REX$))"
> rex2_expr = "\\(REX2\\)"
> no_rex2_expr = "\\(!REX2\\)"
> @@ -319,6 +321,11 @@ function convert_operands(count,opnd, i,j,imm,mod)
> if (match(ext, force64_expr))
> flags = add_flags(flags, "INAT_FORCE64")
>
> + # check invalid in 64bit (and no only64)
> + if (match(ext, invalid64_expr) &&
> + !match($0, only64_expr))
> + flags = add_flags(flags, "INAT_INV64")
> +
> # check REX2 not allowed
> if (match(ext, no_rex2_expr))
> flags = add_flags(flags, "INAT_NO_REX2")
> diff --git a/tools/arch/x86/include/asm/inat.h b/tools/arch/x86/include/asm/inat.h
> index 253690eb3c26..183aa662b165 100644
> --- a/tools/arch/x86/include/asm/inat.h
> +++ b/tools/arch/x86/include/asm/inat.h
> @@ -82,6 +82,7 @@
> #define INAT_NO_REX2 (1 << (INAT_FLAG_OFFS + 8))
> #define INAT_REX2_VARIANT (1 << (INAT_FLAG_OFFS + 9))
> #define INAT_EVEX_SCALABLE (1 << (INAT_FLAG_OFFS + 10))
> +#define INAT_INV64 (1 << (INAT_FLAG_OFFS + 11))
> /* Attribute making macros for attribute tables */
> #define INAT_MAKE_PREFIX(pfx) (pfx << INAT_PFX_OFFS)
> #define INAT_MAKE_ESCAPE(esc) (esc << INAT_ESC_OFFS)
> @@ -242,4 +243,9 @@ static inline int inat_evex_scalable(insn_attr_t attr)
> {
> return attr & INAT_EVEX_SCALABLE;
> }
> +
> +static inline int inat_is_invalid64(insn_attr_t attr)
> +{
> + return attr & INAT_INV64;
> +}
> #endif
> diff --git a/tools/arch/x86/lib/insn.c b/tools/arch/x86/lib/insn.c
> index e91d4c4e1c16..bce69c6bfa69 100644
> --- a/tools/arch/x86/lib/insn.c
> +++ b/tools/arch/x86/lib/insn.c
> @@ -324,6 +324,11 @@ int insn_get_opcode(struct insn *insn)
> }
>
> insn->attr = inat_get_opcode_attribute(op);
> + if (insn->x86_64 && inat_is_invalid64(insn->attr)) {
> + /* This instruction is invalid, like UD2. Stop decoding. */
> + insn->attr &= INAT_INV64;
> + }
> +
> while (inat_is_escape(insn->attr)) {
> /* Get escaped opcode */
> op = get_next(insn_byte_t, insn);
> @@ -337,6 +342,7 @@ int insn_get_opcode(struct insn *insn)
> insn->attr = 0;
> return -EINVAL;
> }
> +
> end:
> opcode->got = 1;
> return 0;
> @@ -658,7 +664,6 @@ int insn_get_immediate(struct insn *insn)
> }
>
> if (!inat_has_immediate(insn->attr))
> - /* no immediates */
> goto done;
>
> switch (inat_immediate_size(insn->attr)) {
> diff --git a/tools/arch/x86/lib/x86-opcode-map.txt b/tools/arch/x86/lib/x86-opcode-map.txt
> index 5e2fa3f7128e..de0be0462190 100644
> --- a/tools/arch/x86/lib/x86-opcode-map.txt
> +++ b/tools/arch/x86/lib/x86-opcode-map.txt
> @@ -147,7 +147,7 @@ AVXcode:
> # 0x60 - 0x6f
> 60: PUSHA/PUSHAD (i64)
> 61: POPA/POPAD (i64)
> -62: BOUND Gv,Ma (i64) | EVEX (Prefix)
> +62: BOUND Gv,Ma (i64) | EVEX (Prefix),(o64)
> 63: ARPL Ew,Gw (i64) | MOVSXD Gv,Ev (o64)
> 64: SEG=FS (Prefix)
> 65: SEG=GS (Prefix)
> @@ -253,8 +253,8 @@ c0: Grp2 Eb,Ib (1A)
> c1: Grp2 Ev,Ib (1A)
> c2: RETN Iw (f64)
> c3: RETN
> -c4: LES Gz,Mp (i64) | VEX+2byte (Prefix)
> -c5: LDS Gz,Mp (i64) | VEX+1byte (Prefix)
> +c4: LES Gz,Mp (i64) | VEX+2byte (Prefix),(o64)
> +c5: LDS Gz,Mp (i64) | VEX+1byte (Prefix),(o64)
> c6: Grp11A Eb,Ib (1A)
> c7: Grp11B Ev,Iz (1A)
> c8: ENTER Iw,Ib
> diff --git a/tools/arch/x86/tools/gen-insn-attr-x86.awk b/tools/arch/x86/tools/gen-insn-attr-x86.awk
> index 5770c8097f32..29e939893082 100644
> --- a/tools/arch/x86/tools/gen-insn-attr-x86.awk
> +++ b/tools/arch/x86/tools/gen-insn-attr-x86.awk
> @@ -64,6 +64,8 @@ BEGIN {
>
> modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
> force64_expr = "\\([df]64\\)"
> + invalid64_expr = "\\(i64\\)"
> + only64_expr = "\\(o64\\)"
> rex_expr = "^((REX(\\.[XRWB]+)+)|(REX$))"
> rex2_expr = "\\(REX2\\)"
> no_rex2_expr = "\\(!REX2\\)"
> @@ -319,6 +321,11 @@ function convert_operands(count,opnd, i,j,imm,mod)
> if (match(ext, force64_expr))
> flags = add_flags(flags, "INAT_FORCE64")
>
> + # check invalid in 64bit (and no only64)
> + if (match(ext, invalid64_expr) &&
> + !match($0, only64_expr))
> + flags = add_flags(flags, "INAT_INV64")
> +
> # check REX2 not allowed
> if (match(ext, no_rex2_expr))
> flags = add_flags(flags, "INAT_NO_REX2")
>
Powered by blists - more mailing lists