Add insn_is_fpu(insn), which tells whether the insn touches the FPU/SSE/MMX registers or is an FP coprocessor instruction. Signed-off-by: Masami Hiramatsu <mhiramat@xxxxxxxxxx> --- Changes in v3: - Add {FPU} to FWAIT/WAIT and FEMMS. - Split INAT_FPU and INAT_MODRM. - Remove a blank line typo. --- arch/x86/include/asm/inat.h | 7 +++ arch/x86/include/asm/insn.h | 12 ++++++ arch/x86/lib/x86-opcode-map.txt | 36 ++++++++++------- arch/x86/tools/gen-insn-attr-x86.awk | 58 +++++++++++++++++++++++++--- tools/arch/x86/include/asm/inat.h | 7 +++ tools/arch/x86/include/asm/insn.h | 12 ++++++ tools/arch/x86/lib/x86-opcode-map.txt | 36 ++++++++++------- tools/arch/x86/tools/gen-insn-attr-x86.awk | 58 +++++++++++++++++++++++++--- 8 files changed, 182 insertions(+), 44 deletions(-) diff --git a/arch/x86/include/asm/inat.h b/arch/x86/include/asm/inat.h index 4cf2ad521f65..ffce45178c08 100644 --- a/arch/x86/include/asm/inat.h +++ b/arch/x86/include/asm/inat.h @@ -77,6 +77,8 @@ #define INAT_VEXOK (1 << (INAT_FLAG_OFFS + 5)) #define INAT_VEXONLY (1 << (INAT_FLAG_OFFS + 6)) #define INAT_EVEXONLY (1 << (INAT_FLAG_OFFS + 7)) +#define INAT_FPU (1 << (INAT_FLAG_OFFS + 8)) +#define INAT_FPUIFVEX (1 << (INAT_FLAG_OFFS + 9)) /* Attribute making macros for attribute tables */ #define INAT_MAKE_PREFIX(pfx) (pfx << INAT_PFX_OFFS) #define INAT_MAKE_ESCAPE(esc) (esc << INAT_ESC_OFFS) @@ -227,4 +229,9 @@ static inline int inat_must_evex(insn_attr_t attr) { return attr & INAT_EVEXONLY; } + +static inline int inat_is_fpu(insn_attr_t attr) +{ + return attr & INAT_FPU; +} #endif diff --git a/arch/x86/include/asm/insn.h b/arch/x86/include/asm/insn.h index 5c1ae3eff9d4..1752c54d2103 100644 --- a/arch/x86/include/asm/insn.h +++ b/arch/x86/include/asm/insn.h @@ -129,6 +129,18 @@ static inline int insn_is_evex(struct insn *insn) return (insn->vex_prefix.nbytes == 4); } +static inline int insn_is_fpu(struct insn *insn) +{ + if (!insn->opcode.got) + insn_get_opcode(insn); + if (inat_is_fpu(insn->attr)) 
{ + if (insn->attr & INAT_FPUIFVEX) + return insn_is_avx(insn); + return 1; + } + return 0; +} + static inline int insn_has_emulate_prefix(struct insn *insn) { return !!insn->emulate_prefix_size; diff --git a/arch/x86/lib/x86-opcode-map.txt b/arch/x86/lib/x86-opcode-map.txt index ec31f5b60323..0adf11cbd3a8 100644 --- a/arch/x86/lib/x86-opcode-map.txt +++ b/arch/x86/lib/x86-opcode-map.txt @@ -33,6 +33,10 @@ # - (F2): the last prefix is 0xF2 # - (!F3) : the last prefix is not 0xF3 (including non-last prefix case) # - (66&F2): Both 0x66 and 0xF2 prefixes are specified. +# +# Optional Superscripts +# - {FPU}: this mnemonic doesn't have FPU/MMX/SSE operands but access those +# registers. Table: one byte opcode Referrer: @@ -202,7 +206,7 @@ AVXcode: 98: CBW/CWDE/CDQE 99: CWD/CDQ/CQO 9a: CALLF Ap (i64) -9b: FWAIT/WAIT +9b: FWAIT/WAIT {FPU} 9c: PUSHF/D/Q Fv (d64) 9d: POPF/D/Q Fv (d64) 9e: SAHF @@ -269,14 +273,16 @@ d4: AAM Ib (i64) d5: AAD Ib (i64) d6: d7: XLAT/XLATB -d8: ESC -d9: ESC -da: ESC -db: ESC -dc: ESC -dd: ESC -de: ESC -df: ESC +# Intel SDM Appendix A Opcode Map shows these opcode are ESC (Escape to +# coprocessor instruction set), the coprocessor means x87 FPU. +d8: ESC {FPU} +d9: ESC {FPU} +da: ESC {FPU} +db: ESC {FPU} +dc: ESC {FPU} +dd: ESC {FPU} +de: ESC {FPU} +df: ESC {FPU} # 0xe0 - 0xef # Note: "forced64" is Intel CPU behavior: they ignore 0x66 prefix # in 64-bit mode. AMD CPUs accept 0x66 prefix, it causes RIP truncation @@ -339,7 +345,7 @@ AVXcode: 1 0c: # AMD's prefetch group. Intel supports prefetchw(/1) only. 0d: GrpP -0e: FEMMS +0e: FEMMS {FPU} # 3DNow! uses the last imm byte as opcode extension. 0f: 3DNow! Pq,Qq,Ib # 0x0f 0x10-0x1f @@ -462,7 +468,7 @@ AVXcode: 1 75: pcmpeqw Pq,Qq | vpcmpeqw Vx,Hx,Wx (66),(v1) 76: pcmpeqd Pq,Qq | vpcmpeqd Vx,Hx,Wx (66),(v1) # Note: Remove (v), because vzeroall and vzeroupper becomes emms without VEX. 
-77: emms | vzeroupper | vzeroall +77: emms {FPU} | vzeroupper | vzeroall 78: VMREAD Ey,Gy | vcvttps2udq/pd2udq Vx,Wpd (evo) | vcvttsd2usi Gv,Wx (F2),(ev) | vcvttss2usi Gv,Wx (F3),(ev) | vcvttps2uqq/pd2uqq Vx,Wx (66),(ev) 79: VMWRITE Gy,Ey | vcvtps2udq/pd2udq Vx,Wpd (evo) | vcvtsd2usi Gv,Wx (F2),(ev) | vcvtss2usi Gv,Wx (F3),(ev) | vcvtps2uqq/pd2uqq Vx,Wx (66),(ev) 7a: vcvtudq2pd/uqq2pd Vpd,Wx (F3),(ev) | vcvtudq2ps/uqq2ps Vpd,Wx (F2),(ev) | vcvttps2qq/pd2qq Vx,Wx (66),(ev) @@ -1036,10 +1042,10 @@ GrpTable: Grp14 EndTable GrpTable: Grp15 -0: fxsave | RDFSBASE Ry (F3),(11B) -1: fxstor | RDGSBASE Ry (F3),(11B) -2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B) -3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B) +0: fxsave {FPU} | RDFSBASE Ry (F3),(11B) +1: fxrstor {FPU} | RDGSBASE Ry (F3),(11B) +2: ldmxcsr {FPU} | vldmxcsr Md (v1),{FPU} | WRFSBASE Ry (F3),(11B) +3: stmxcsr {FPU} | vstmxcsr Md (v1),{FPU} | WRGSBASE Ry (F3),(11B) 4: XSAVE | ptwrite Ey (F3),(11B) 5: XRSTOR | lfence (11B) | INCSSPD/Q Ry (F3),(11B) 6: XSAVEOPT | clwb (66) | mfence (11B) | TPAUSE Rd (66),(11B) | UMONITOR Rv (F3),(11B) | UMWAIT Rd (F2),(11B) | CLRSSBSY Mq (F3) diff --git a/arch/x86/tools/gen-insn-attr-x86.awk b/arch/x86/tools/gen-insn-attr-x86.awk index a42015b305f4..d8a9dae42c3d 100644 --- a/arch/x86/tools/gen-insn-attr-x86.awk +++ b/arch/x86/tools/gen-insn-attr-x86.awk @@ -44,7 +44,7 @@ BEGIN { delete atable opnd_expr = "^[A-Za-z/]" - ext_expr = "^\\(" + ext_expr = "^(\\(|\\{)" sep_expr = "^\\|$" group_expr = "^Grp[0-9A-Za-z]+" @@ -65,7 +65,10 @@ BEGIN { modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])" force64_expr = "\\([df]64\\)" rex_expr = "^REX(\\.[XRWB]+)*" - fpu_expr = "^ESC" # TODO + x87_expr = "^ESC" + + fpureg_expr = "^[HLNPQUVW][a-z]+" # MMX/SSE register operands + fpu_expr = "\\{FPU\\}" lprefix1_expr = "\\((66|!F3)\\)" lprefix2_expr = "\\(F3\\)" @@ -236,10 +239,11 @@ function add_flags(old,new) { } # convert operands to flags. 
-function convert_operands(count,opnd, i,j,imm,mod) +function convert_operands(count,opnd, i,j,imm,mod,fpu) { imm = null mod = null + fpu = null for (j = 1; j <= count; j++) { i = opnd[j] if (match(i, imm_expr) == 1) { @@ -253,7 +257,12 @@ function convert_operands(count,opnd, i,j,imm,mod) imm = imm_flag[i] } else if (match(i, modrm_expr)) mod = "INAT_MODRM" + if (match(i, fpureg_expr) == 1) { + fpu = "INAT_FPU" + } } + if (fpu) + imm = add_flags(imm, fpu) return add_flags(imm, mod) } @@ -283,6 +292,10 @@ function convert_operands(count,opnd, i,j,imm,mod) variant = null # converts i = 2 + lpfpu[0] = 0 + lpfpu[1] = 0 + lpfpu[2] = 0 + lpfpu[3] = 0 while (i <= NF) { opcode = $(i++) delete opnds @@ -318,10 +331,14 @@ function convert_operands(count,opnd, i,j,imm,mod) if (match(opcode, rex_expr)) flags = add_flags(flags, "INAT_MAKE_PREFIX(INAT_PFX_REX)") - # check coprocessor escape : TODO - if (match(opcode, fpu_expr)) + # x87 escape opcode needs MODRM + if (match(ext, x87_expr)) flags = add_flags(flags, "INAT_MODRM") + # check FPU/MMX/SSE superscripts + if (match(ext, fpu_expr)) + flags = add_flags(flags, "INAT_FPU") + # check VEX codes if (match(ext, evexonly_expr)) flags = add_flags(flags, "INAT_VEXOK | INAT_EVEXONLY") @@ -336,22 +353,49 @@ function convert_operands(count,opnd, i,j,imm,mod) semantic_error("Unknown prefix: " opcode) flags = add_flags(flags, "INAT_MAKE_PREFIX(" prefix_num[opcode] ")") } - if (length(flags) == 0) - continue + # check if last prefix if (match(ext, lprefix1_expr)) { + if (lpfpu[1] == 0 && flags !~ "INAT_FPU") + lpfpu[1] = 1 + else if (lpfpu[1] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; lptable1[idx] = add_flags(lptable1[idx],flags) variant = "INAT_VARIANT" } if (match(ext, lprefix2_expr)) { + if (lpfpu[2] == 0 && flags !~ "INAT_FPU") + lpfpu[2] = 1 + else if (lpfpu[2] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + 
continue; lptable2[idx] = add_flags(lptable2[idx],flags) variant = "INAT_VARIANT" } if (match(ext, lprefix3_expr)) { + if (lpfpu[3] == 0 && flags !~ "INAT_FPU") + lpfpu[3] = 1 + else if (lpfpu[3] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; lptable3[idx] = add_flags(lptable3[idx],flags) variant = "INAT_VARIANT" } if (!match(ext, lprefix_expr)){ + if (lpfpu[0] == 0 && flags !~ "INAT_FPU") { + lpfpu[0] = 1 + lpfpu[1] = 1 + lpfpu[2] = 1 + lpfpu[3] = 1 + } + else if (lpfpu[0] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; table[idx] = add_flags(table[idx],flags) } } diff --git a/tools/arch/x86/include/asm/inat.h b/tools/arch/x86/include/asm/inat.h index 877827b7c2c3..2e6a05290efd 100644 --- a/tools/arch/x86/include/asm/inat.h +++ b/tools/arch/x86/include/asm/inat.h @@ -77,6 +77,8 @@ #define INAT_VEXOK (1 << (INAT_FLAG_OFFS + 5)) #define INAT_VEXONLY (1 << (INAT_FLAG_OFFS + 6)) #define INAT_EVEXONLY (1 << (INAT_FLAG_OFFS + 7)) +#define INAT_FPU (1 << (INAT_FLAG_OFFS + 8)) +#define INAT_FPUIFVEX (1 << (INAT_FLAG_OFFS + 9)) /* Attribute making macros for attribute tables */ #define INAT_MAKE_PREFIX(pfx) (pfx << INAT_PFX_OFFS) #define INAT_MAKE_ESCAPE(esc) (esc << INAT_ESC_OFFS) @@ -227,4 +229,9 @@ static inline int inat_must_evex(insn_attr_t attr) { return attr & INAT_EVEXONLY; } + +static inline int inat_is_fpu(insn_attr_t attr) +{ + return attr & INAT_FPU; +} #endif diff --git a/tools/arch/x86/include/asm/insn.h b/tools/arch/x86/include/asm/insn.h index 568854b14d0a..d9f6bd9059c1 100644 --- a/tools/arch/x86/include/asm/insn.h +++ b/tools/arch/x86/include/asm/insn.h @@ -129,6 +129,18 @@ static inline int insn_is_evex(struct insn *insn) return (insn->vex_prefix.nbytes == 4); } +static inline int insn_is_fpu(struct insn *insn) +{ + if (!insn->opcode.got) + insn_get_opcode(insn); + if (inat_is_fpu(insn->attr)) { + if (insn->attr & INAT_FPUIFVEX) + 
return insn_is_avx(insn); + return 1; + } + return 0; +} + static inline int insn_has_emulate_prefix(struct insn *insn) { return !!insn->emulate_prefix_size; diff --git a/tools/arch/x86/lib/x86-opcode-map.txt b/tools/arch/x86/lib/x86-opcode-map.txt index ec31f5b60323..0adf11cbd3a8 100644 --- a/tools/arch/x86/lib/x86-opcode-map.txt +++ b/tools/arch/x86/lib/x86-opcode-map.txt @@ -33,6 +33,10 @@ # - (F2): the last prefix is 0xF2 # - (!F3) : the last prefix is not 0xF3 (including non-last prefix case) # - (66&F2): Both 0x66 and 0xF2 prefixes are specified. +# +# Optional Superscripts +# - {FPU}: this mnemonic doesn't have FPU/MMX/SSE operands but access those +# registers. Table: one byte opcode Referrer: @@ -202,7 +206,7 @@ AVXcode: 98: CBW/CWDE/CDQE 99: CWD/CDQ/CQO 9a: CALLF Ap (i64) -9b: FWAIT/WAIT +9b: FWAIT/WAIT {FPU} 9c: PUSHF/D/Q Fv (d64) 9d: POPF/D/Q Fv (d64) 9e: SAHF @@ -269,14 +273,16 @@ d4: AAM Ib (i64) d5: AAD Ib (i64) d6: d7: XLAT/XLATB -d8: ESC -d9: ESC -da: ESC -db: ESC -dc: ESC -dd: ESC -de: ESC -df: ESC +# Intel SDM Appendix A Opcode Map shows these opcode are ESC (Escape to +# coprocessor instruction set), the coprocessor means x87 FPU. +d8: ESC {FPU} +d9: ESC {FPU} +da: ESC {FPU} +db: ESC {FPU} +dc: ESC {FPU} +dd: ESC {FPU} +de: ESC {FPU} +df: ESC {FPU} # 0xe0 - 0xef # Note: "forced64" is Intel CPU behavior: they ignore 0x66 prefix # in 64-bit mode. AMD CPUs accept 0x66 prefix, it causes RIP truncation @@ -339,7 +345,7 @@ AVXcode: 1 0c: # AMD's prefetch group. Intel supports prefetchw(/1) only. 0d: GrpP -0e: FEMMS +0e: FEMMS {FPU} # 3DNow! uses the last imm byte as opcode extension. 0f: 3DNow! Pq,Qq,Ib # 0x0f 0x10-0x1f @@ -462,7 +468,7 @@ AVXcode: 1 75: pcmpeqw Pq,Qq | vpcmpeqw Vx,Hx,Wx (66),(v1) 76: pcmpeqd Pq,Qq | vpcmpeqd Vx,Hx,Wx (66),(v1) # Note: Remove (v), because vzeroall and vzeroupper becomes emms without VEX. 
-77: emms | vzeroupper | vzeroall +77: emms {FPU} | vzeroupper | vzeroall 78: VMREAD Ey,Gy | vcvttps2udq/pd2udq Vx,Wpd (evo) | vcvttsd2usi Gv,Wx (F2),(ev) | vcvttss2usi Gv,Wx (F3),(ev) | vcvttps2uqq/pd2uqq Vx,Wx (66),(ev) 79: VMWRITE Gy,Ey | vcvtps2udq/pd2udq Vx,Wpd (evo) | vcvtsd2usi Gv,Wx (F2),(ev) | vcvtss2usi Gv,Wx (F3),(ev) | vcvtps2uqq/pd2uqq Vx,Wx (66),(ev) 7a: vcvtudq2pd/uqq2pd Vpd,Wx (F3),(ev) | vcvtudq2ps/uqq2ps Vpd,Wx (F2),(ev) | vcvttps2qq/pd2qq Vx,Wx (66),(ev) @@ -1036,10 +1042,10 @@ GrpTable: Grp14 EndTable GrpTable: Grp15 -0: fxsave | RDFSBASE Ry (F3),(11B) -1: fxstor | RDGSBASE Ry (F3),(11B) -2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B) -3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B) +0: fxsave {FPU} | RDFSBASE Ry (F3),(11B) +1: fxrstor {FPU} | RDGSBASE Ry (F3),(11B) +2: ldmxcsr {FPU} | vldmxcsr Md (v1),{FPU} | WRFSBASE Ry (F3),(11B) +3: stmxcsr {FPU} | vstmxcsr Md (v1),{FPU} | WRGSBASE Ry (F3),(11B) 4: XSAVE | ptwrite Ey (F3),(11B) 5: XRSTOR | lfence (11B) | INCSSPD/Q Ry (F3),(11B) 6: XSAVEOPT | clwb (66) | mfence (11B) | TPAUSE Rd (66),(11B) | UMONITOR Rv (F3),(11B) | UMWAIT Rd (F2),(11B) | CLRSSBSY Mq (F3) diff --git a/tools/arch/x86/tools/gen-insn-attr-x86.awk b/tools/arch/x86/tools/gen-insn-attr-x86.awk index a42015b305f4..d8a9dae42c3d 100644 --- a/tools/arch/x86/tools/gen-insn-attr-x86.awk +++ b/tools/arch/x86/tools/gen-insn-attr-x86.awk @@ -44,7 +44,7 @@ BEGIN { delete atable opnd_expr = "^[A-Za-z/]" - ext_expr = "^\\(" + ext_expr = "^(\\(|\\{)" sep_expr = "^\\|$" group_expr = "^Grp[0-9A-Za-z]+" @@ -65,7 +65,10 @@ BEGIN { modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])" force64_expr = "\\([df]64\\)" rex_expr = "^REX(\\.[XRWB]+)*" - fpu_expr = "^ESC" # TODO + x87_expr = "^ESC" + + fpureg_expr = "^[HLNPQUVW][a-z]+" # MMX/SSE register operands + fpu_expr = "\\{FPU\\}" lprefix1_expr = "\\((66|!F3)\\)" lprefix2_expr = "\\(F3\\)" @@ -236,10 +239,11 @@ function add_flags(old,new) { } # convert operands to flags. 
-function convert_operands(count,opnd, i,j,imm,mod) +function convert_operands(count,opnd, i,j,imm,mod,fpu) { imm = null mod = null + fpu = null for (j = 1; j <= count; j++) { i = opnd[j] if (match(i, imm_expr) == 1) { @@ -253,7 +257,12 @@ function convert_operands(count,opnd, i,j,imm,mod) imm = imm_flag[i] } else if (match(i, modrm_expr)) mod = "INAT_MODRM" + if (match(i, fpureg_expr) == 1) { + fpu = "INAT_FPU" + } } + if (fpu) + imm = add_flags(imm, fpu) return add_flags(imm, mod) } @@ -283,6 +292,10 @@ function convert_operands(count,opnd, i,j,imm,mod) variant = null # converts i = 2 + lpfpu[0] = 0 + lpfpu[1] = 0 + lpfpu[2] = 0 + lpfpu[3] = 0 while (i <= NF) { opcode = $(i++) delete opnds @@ -318,10 +331,14 @@ function convert_operands(count,opnd, i,j,imm,mod) if (match(opcode, rex_expr)) flags = add_flags(flags, "INAT_MAKE_PREFIX(INAT_PFX_REX)") - # check coprocessor escape : TODO - if (match(opcode, fpu_expr)) + # x87 escape opcode needs MODRM + if (match(ext, x87_expr)) flags = add_flags(flags, "INAT_MODRM") + # check FPU/MMX/SSE superscripts + if (match(ext, fpu_expr)) + flags = add_flags(flags, "INAT_FPU") + # check VEX codes if (match(ext, evexonly_expr)) flags = add_flags(flags, "INAT_VEXOK | INAT_EVEXONLY") @@ -336,22 +353,49 @@ function convert_operands(count,opnd, i,j,imm,mod) semantic_error("Unknown prefix: " opcode) flags = add_flags(flags, "INAT_MAKE_PREFIX(" prefix_num[opcode] ")") } - if (length(flags) == 0) - continue + # check if last prefix if (match(ext, lprefix1_expr)) { + if (lpfpu[1] == 0 && flags !~ "INAT_FPU") + lpfpu[1] = 1 + else if (lpfpu[1] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; lptable1[idx] = add_flags(lptable1[idx],flags) variant = "INAT_VARIANT" } if (match(ext, lprefix2_expr)) { + if (lpfpu[2] == 0 && flags !~ "INAT_FPU") + lpfpu[2] = 1 + else if (lpfpu[2] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + 
continue; lptable2[idx] = add_flags(lptable2[idx],flags) variant = "INAT_VARIANT" } if (match(ext, lprefix3_expr)) { + if (lpfpu[3] == 0 && flags !~ "INAT_FPU") + lpfpu[3] = 1 + else if (lpfpu[3] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; lptable3[idx] = add_flags(lptable3[idx],flags) variant = "INAT_VARIANT" } if (!match(ext, lprefix_expr)){ + if (lpfpu[0] == 0 && flags !~ "INAT_FPU") { + lpfpu[0] = 1 + lpfpu[1] = 1 + lpfpu[2] = 1 + lpfpu[3] = 1 + } + else if (lpfpu[0] != 0 && flags ~ "INAT_FPU") + flags = add_flags(flags, "INAT_FPUIFVEX") + if (length(flags) == 0) + continue; table[idx] = add_flags(table[idx],flags) } } _______________________________________________ amd-gfx mailing list amd-gfx@xxxxxxxxxxxxxxxxxxxxx https://lists.freedesktop.org/mailman/listinfo/amd-gfx