Add insn_is_fpu(insn), which tells whether the insn touches
the FPU/SSE/MMX registers or is an FP coprocessor
instruction.

Signed-off-by: Masami Hiramatsu <mhira...@kernel.org>
---
 Changes in v3:
 - Add {FPU} to FWAIT/WAIT and FEMMS.
 - Split INAT_FPU and INAT_MODRM.
 - Remove a blank line typo.
---
 arch/x86/include/asm/inat.h                |    7 +++
 arch/x86/include/asm/insn.h                |   12 ++++++
 arch/x86/lib/x86-opcode-map.txt            |   36 ++++++++++-------
 arch/x86/tools/gen-insn-attr-x86.awk       |   58 +++++++++++++++++++++++++---
 tools/arch/x86/include/asm/inat.h          |    7 +++
 tools/arch/x86/include/asm/insn.h          |   12 ++++++
 tools/arch/x86/lib/x86-opcode-map.txt      |   36 ++++++++++-------
 tools/arch/x86/tools/gen-insn-attr-x86.awk |   58 +++++++++++++++++++++++++---
 8 files changed, 182 insertions(+), 44 deletions(-)

diff --git a/arch/x86/include/asm/inat.h b/arch/x86/include/asm/inat.h
index 4cf2ad521f65..ffce45178c08 100644
--- a/arch/x86/include/asm/inat.h
+++ b/arch/x86/include/asm/inat.h
@@ -77,6 +77,8 @@
 #define INAT_VEXOK     (1 << (INAT_FLAG_OFFS + 5))
 #define INAT_VEXONLY   (1 << (INAT_FLAG_OFFS + 6))
 #define INAT_EVEXONLY  (1 << (INAT_FLAG_OFFS + 7))
+#define INAT_FPU       (1 << (INAT_FLAG_OFFS + 8))
+#define INAT_FPUIFVEX  (1 << (INAT_FLAG_OFFS + 9))
 /* Attribute making macros for attribute tables */
 #define INAT_MAKE_PREFIX(pfx)  (pfx << INAT_PFX_OFFS)
 #define INAT_MAKE_ESCAPE(esc)  (esc << INAT_ESC_OFFS)
@@ -227,4 +229,9 @@ static inline int inat_must_evex(insn_attr_t attr)
 {
        return attr & INAT_EVEXONLY;
 }
+
+static inline int inat_is_fpu(insn_attr_t attr)
+{
+       return attr & INAT_FPU;
+}
 #endif
diff --git a/arch/x86/include/asm/insn.h b/arch/x86/include/asm/insn.h
index 5c1ae3eff9d4..1752c54d2103 100644
--- a/arch/x86/include/asm/insn.h
+++ b/arch/x86/include/asm/insn.h
@@ -129,6 +129,18 @@ static inline int insn_is_evex(struct insn *insn)
        return (insn->vex_prefix.nbytes == 4);
 }
 
+static inline int insn_is_fpu(struct insn *insn)
+{
+       if (!insn->opcode.got)
+               insn_get_opcode(insn);
+       if (inat_is_fpu(insn->attr)) {
+               if (insn->attr & INAT_FPUIFVEX)
+                       return insn_is_avx(insn);
+               return 1;
+       }
+       return 0;
+}
+
 static inline int insn_has_emulate_prefix(struct insn *insn)
 {
        return !!insn->emulate_prefix_size;
diff --git a/arch/x86/lib/x86-opcode-map.txt b/arch/x86/lib/x86-opcode-map.txt
index ec31f5b60323..0adf11cbd3a8 100644
--- a/arch/x86/lib/x86-opcode-map.txt
+++ b/arch/x86/lib/x86-opcode-map.txt
@@ -33,6 +33,10 @@
 #  - (F2): the last prefix is 0xF2
 #  - (!F3) : the last prefix is not 0xF3 (including non-last prefix case)
 #  - (66&F2): Both 0x66 and 0xF2 prefixes are specified.
+#
+# Optional Superscripts
+#  - {FPU}: this mnemonic doesn't have FPU/MMX/SSE operands but access those
+#           registers.
 
 Table: one byte opcode
 Referrer:
@@ -202,7 +206,7 @@ AVXcode:
 98: CBW/CWDE/CDQE
 99: CWD/CDQ/CQO
 9a: CALLF Ap (i64)
-9b: FWAIT/WAIT
+9b: FWAIT/WAIT {FPU}
 9c: PUSHF/D/Q Fv (d64)
 9d: POPF/D/Q Fv (d64)
 9e: SAHF
@@ -269,14 +273,16 @@ d4: AAM Ib (i64)
 d5: AAD Ib (i64)
 d6:
 d7: XLAT/XLATB
-d8: ESC
-d9: ESC
-da: ESC
-db: ESC
-dc: ESC
-dd: ESC
-de: ESC
-df: ESC
+# Intel SDM Appendix A Opcode Map shows these opcode are ESC (Escape to
+# coprocessor instruction set), the coprocessor means x87 FPU.
+d8: ESC {FPU}
+d9: ESC {FPU}
+da: ESC {FPU}
+db: ESC {FPU}
+dc: ESC {FPU}
+dd: ESC {FPU}
+de: ESC {FPU}
+df: ESC {FPU}
 # 0xe0 - 0xef
 # Note: "forced64" is Intel CPU behavior: they ignore 0x66 prefix
 # in 64-bit mode. AMD CPUs accept 0x66 prefix, it causes RIP truncation
@@ -339,7 +345,7 @@ AVXcode: 1
 0c:
 # AMD's prefetch group. Intel supports prefetchw(/1) only.
 0d: GrpP
-0e: FEMMS
+0e: FEMMS {FPU}
 # 3DNow! uses the last imm byte as opcode extension.
 0f: 3DNow! Pq,Qq,Ib
 # 0x0f 0x10-0x1f
@@ -462,7 +468,7 @@ AVXcode: 1
 75: pcmpeqw Pq,Qq | vpcmpeqw Vx,Hx,Wx (66),(v1)
 76: pcmpeqd Pq,Qq | vpcmpeqd Vx,Hx,Wx (66),(v1)
 # Note: Remove (v), because vzeroall and vzeroupper becomes emms without VEX.
-77: emms | vzeroupper | vzeroall
+77: emms {FPU} | vzeroupper | vzeroall
 78: VMREAD Ey,Gy | vcvttps2udq/pd2udq Vx,Wpd (evo) | vcvttsd2usi Gv,Wx (F2),(ev) | vcvttss2usi Gv,Wx (F3),(ev) | vcvttps2uqq/pd2uqq Vx,Wx (66),(ev)
 79: VMWRITE Gy,Ey | vcvtps2udq/pd2udq Vx,Wpd (evo) | vcvtsd2usi Gv,Wx (F2),(ev) | vcvtss2usi Gv,Wx (F3),(ev) | vcvtps2uqq/pd2uqq Vx,Wx (66),(ev)
 7a: vcvtudq2pd/uqq2pd Vpd,Wx (F3),(ev) | vcvtudq2ps/uqq2ps Vpd,Wx (F2),(ev) | vcvttps2qq/pd2qq Vx,Wx (66),(ev)
@@ -1036,10 +1042,10 @@ GrpTable: Grp14
 EndTable
 
 GrpTable: Grp15
-0: fxsave | RDFSBASE Ry (F3),(11B)
-1: fxstor | RDGSBASE Ry (F3),(11B)
-2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
-3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
+0: fxsave {FPU} | RDFSBASE Ry (F3),(11B)
+1: fxrstor {FPU} | RDGSBASE Ry (F3),(11B)
+2: ldmxcsr {FPU} | vldmxcsr Md (v1),{FPU} | WRFSBASE Ry (F3),(11B)
+3: stmxcsr {FPU} | vstmxcsr Md (v1),{FPU} | WRGSBASE Ry (F3),(11B)
 4: XSAVE | ptwrite Ey (F3),(11B)
 5: XRSTOR | lfence (11B) | INCSSPD/Q Ry (F3),(11B)
 6: XSAVEOPT | clwb (66) | mfence (11B) | TPAUSE Rd (66),(11B) | UMONITOR Rv (F3),(11B) | UMWAIT Rd (F2),(11B) | CLRSSBSY Mq (F3)
diff --git a/arch/x86/tools/gen-insn-attr-x86.awk b/arch/x86/tools/gen-insn-attr-x86.awk
index a42015b305f4..d8a9dae42c3d 100644
--- a/arch/x86/tools/gen-insn-attr-x86.awk
+++ b/arch/x86/tools/gen-insn-attr-x86.awk
@@ -44,7 +44,7 @@ BEGIN {
        delete atable
 
        opnd_expr = "^[A-Za-z/]"
-       ext_expr = "^\\("
+       ext_expr = "^(\\(|\\{)"
        sep_expr = "^\\|$"
        group_expr = "^Grp[0-9A-Za-z]+"
 
@@ -65,7 +65,10 @@ BEGIN {
        modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
        force64_expr = "\\([df]64\\)"
        rex_expr = "^REX(\\.[XRWB]+)*"
-       fpu_expr = "^ESC" # TODO
+       x87_expr = "^ESC"
+
+       fpureg_expr = "^[HLNPQUVW][a-z]+" # MMX/SSE register operands
+       fpu_expr = "\\{FPU\\}"
 
        lprefix1_expr = "\\((66|!F3)\\)"
        lprefix2_expr = "\\(F3\\)"
@@ -236,10 +239,11 @@ function add_flags(old,new) {
 }
 
 # convert operands to flags.
-function convert_operands(count,opnd,       i,j,imm,mod)
+function convert_operands(count,opnd,       i,j,imm,mod,fpu)
 {
        imm = null
        mod = null
+       fpu = null
        for (j = 1; j <= count; j++) {
                i = opnd[j]
                if (match(i, imm_expr) == 1) {
@@ -253,7 +257,12 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                                imm = imm_flag[i]
                } else if (match(i, modrm_expr))
                        mod = "INAT_MODRM"
+               if (match(i, fpureg_expr) == 1) {
+                       fpu = "INAT_FPU"
+               }
        }
+       if (fpu)
+               imm = add_flags(imm, fpu)
        return add_flags(imm, mod)
 }
 
@@ -283,6 +292,10 @@ function convert_operands(count,opnd,       i,j,imm,mod)
        variant = null
        # converts
        i = 2
+       lpfpu[0] = 0
+       lpfpu[1] = 0
+       lpfpu[2] = 0
+       lpfpu[3] = 0
        while (i <= NF) {
                opcode = $(i++)
                delete opnds
@@ -318,10 +331,14 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                if (match(opcode, rex_expr))
                        flags = add_flags(flags, "INAT_MAKE_PREFIX(INAT_PFX_REX)")
 
-               # check coprocessor escape : TODO
-               if (match(opcode, fpu_expr))
+               # x87 escape opcode needs MODRM
+               if (match(ext, x87_expr))
                        flags = add_flags(flags, "INAT_MODRM")
 
+               # check FPU/MMX/SSE superscripts
+               if (match(ext, fpu_expr))
+                       flags = add_flags(flags, "INAT_FPU")
+
                # check VEX codes
                if (match(ext, evexonly_expr))
                        flags = add_flags(flags, "INAT_VEXOK | INAT_EVEXONLY")
@@ -336,22 +353,49 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                                semantic_error("Unknown prefix: " opcode)
                        flags = add_flags(flags, "INAT_MAKE_PREFIX(" prefix_num[opcode] ")")
                }
-               if (length(flags) == 0)
-                       continue
+
                # check if last prefix
                if (match(ext, lprefix1_expr)) {
+                       if (lpfpu[1] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[1] = 1
+                       else if (lpfpu[1] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable1[idx] = add_flags(lptable1[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (match(ext, lprefix2_expr)) {
+                       if (lpfpu[2] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[2] = 1
+                       else if (lpfpu[2] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable2[idx] = add_flags(lptable2[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (match(ext, lprefix3_expr)) {
+                       if (lpfpu[3] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[3] = 1
+                       else if (lpfpu[3] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable3[idx] = add_flags(lptable3[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (!match(ext, lprefix_expr)){
+                       if (lpfpu[0] == 0 && flags !~ "INAT_FPU") {
+                               lpfpu[0] = 1
+                               lpfpu[1] = 1
+                               lpfpu[2] = 1
+                               lpfpu[3] = 1
+                       }
+                       else if (lpfpu[0] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        table[idx] = add_flags(table[idx],flags)
                }
        }
diff --git a/tools/arch/x86/include/asm/inat.h b/tools/arch/x86/include/asm/inat.h
index 877827b7c2c3..2e6a05290efd 100644
--- a/tools/arch/x86/include/asm/inat.h
+++ b/tools/arch/x86/include/asm/inat.h
@@ -77,6 +77,8 @@
 #define INAT_VEXOK     (1 << (INAT_FLAG_OFFS + 5))
 #define INAT_VEXONLY   (1 << (INAT_FLAG_OFFS + 6))
 #define INAT_EVEXONLY  (1 << (INAT_FLAG_OFFS + 7))
+#define INAT_FPU       (1 << (INAT_FLAG_OFFS + 8))
+#define INAT_FPUIFVEX  (1 << (INAT_FLAG_OFFS + 9))
 /* Attribute making macros for attribute tables */
 #define INAT_MAKE_PREFIX(pfx)  (pfx << INAT_PFX_OFFS)
 #define INAT_MAKE_ESCAPE(esc)  (esc << INAT_ESC_OFFS)
@@ -227,4 +229,9 @@ static inline int inat_must_evex(insn_attr_t attr)
 {
        return attr & INAT_EVEXONLY;
 }
+
+static inline int inat_is_fpu(insn_attr_t attr)
+{
+       return attr & INAT_FPU;
+}
 #endif
diff --git a/tools/arch/x86/include/asm/insn.h b/tools/arch/x86/include/asm/insn.h
index 568854b14d0a..d9f6bd9059c1 100644
--- a/tools/arch/x86/include/asm/insn.h
+++ b/tools/arch/x86/include/asm/insn.h
@@ -129,6 +129,18 @@ static inline int insn_is_evex(struct insn *insn)
        return (insn->vex_prefix.nbytes == 4);
 }
 
+static inline int insn_is_fpu(struct insn *insn)
+{
+       if (!insn->opcode.got)
+               insn_get_opcode(insn);
+       if (inat_is_fpu(insn->attr)) {
+               if (insn->attr & INAT_FPUIFVEX)
+                       return insn_is_avx(insn);
+               return 1;
+       }
+       return 0;
+}
+
 static inline int insn_has_emulate_prefix(struct insn *insn)
 {
        return !!insn->emulate_prefix_size;
diff --git a/tools/arch/x86/lib/x86-opcode-map.txt b/tools/arch/x86/lib/x86-opcode-map.txt
index ec31f5b60323..0adf11cbd3a8 100644
--- a/tools/arch/x86/lib/x86-opcode-map.txt
+++ b/tools/arch/x86/lib/x86-opcode-map.txt
@@ -33,6 +33,10 @@
 #  - (F2): the last prefix is 0xF2
 #  - (!F3) : the last prefix is not 0xF3 (including non-last prefix case)
 #  - (66&F2): Both 0x66 and 0xF2 prefixes are specified.
+#
+# Optional Superscripts
+#  - {FPU}: this mnemonic doesn't have FPU/MMX/SSE operands but access those
+#           registers.
 
 Table: one byte opcode
 Referrer:
@@ -202,7 +206,7 @@ AVXcode:
 98: CBW/CWDE/CDQE
 99: CWD/CDQ/CQO
 9a: CALLF Ap (i64)
-9b: FWAIT/WAIT
+9b: FWAIT/WAIT {FPU}
 9c: PUSHF/D/Q Fv (d64)
 9d: POPF/D/Q Fv (d64)
 9e: SAHF
@@ -269,14 +273,16 @@ d4: AAM Ib (i64)
 d5: AAD Ib (i64)
 d6:
 d7: XLAT/XLATB
-d8: ESC
-d9: ESC
-da: ESC
-db: ESC
-dc: ESC
-dd: ESC
-de: ESC
-df: ESC
+# Intel SDM Appendix A Opcode Map shows these opcode are ESC (Escape to
+# coprocessor instruction set), the coprocessor means x87 FPU.
+d8: ESC {FPU}
+d9: ESC {FPU}
+da: ESC {FPU}
+db: ESC {FPU}
+dc: ESC {FPU}
+dd: ESC {FPU}
+de: ESC {FPU}
+df: ESC {FPU}
 # 0xe0 - 0xef
 # Note: "forced64" is Intel CPU behavior: they ignore 0x66 prefix
 # in 64-bit mode. AMD CPUs accept 0x66 prefix, it causes RIP truncation
@@ -339,7 +345,7 @@ AVXcode: 1
 0c:
 # AMD's prefetch group. Intel supports prefetchw(/1) only.
 0d: GrpP
-0e: FEMMS
+0e: FEMMS {FPU}
 # 3DNow! uses the last imm byte as opcode extension.
 0f: 3DNow! Pq,Qq,Ib
 # 0x0f 0x10-0x1f
@@ -462,7 +468,7 @@ AVXcode: 1
 75: pcmpeqw Pq,Qq | vpcmpeqw Vx,Hx,Wx (66),(v1)
 76: pcmpeqd Pq,Qq | vpcmpeqd Vx,Hx,Wx (66),(v1)
 # Note: Remove (v), because vzeroall and vzeroupper becomes emms without VEX.
-77: emms | vzeroupper | vzeroall
+77: emms {FPU} | vzeroupper | vzeroall
 78: VMREAD Ey,Gy | vcvttps2udq/pd2udq Vx,Wpd (evo) | vcvttsd2usi Gv,Wx (F2),(ev) | vcvttss2usi Gv,Wx (F3),(ev) | vcvttps2uqq/pd2uqq Vx,Wx (66),(ev)
 79: VMWRITE Gy,Ey | vcvtps2udq/pd2udq Vx,Wpd (evo) | vcvtsd2usi Gv,Wx (F2),(ev) | vcvtss2usi Gv,Wx (F3),(ev) | vcvtps2uqq/pd2uqq Vx,Wx (66),(ev)
 7a: vcvtudq2pd/uqq2pd Vpd,Wx (F3),(ev) | vcvtudq2ps/uqq2ps Vpd,Wx (F2),(ev) | vcvttps2qq/pd2qq Vx,Wx (66),(ev)
@@ -1036,10 +1042,10 @@ GrpTable: Grp14
 EndTable
 
 GrpTable: Grp15
-0: fxsave | RDFSBASE Ry (F3),(11B)
-1: fxstor | RDGSBASE Ry (F3),(11B)
-2: vldmxcsr Md (v1) | WRFSBASE Ry (F3),(11B)
-3: vstmxcsr Md (v1) | WRGSBASE Ry (F3),(11B)
+0: fxsave {FPU} | RDFSBASE Ry (F3),(11B)
+1: fxrstor {FPU} | RDGSBASE Ry (F3),(11B)
+2: ldmxcsr {FPU} | vldmxcsr Md (v1),{FPU} | WRFSBASE Ry (F3),(11B)
+3: stmxcsr {FPU} | vstmxcsr Md (v1),{FPU} | WRGSBASE Ry (F3),(11B)
 4: XSAVE | ptwrite Ey (F3),(11B)
 5: XRSTOR | lfence (11B) | INCSSPD/Q Ry (F3),(11B)
 6: XSAVEOPT | clwb (66) | mfence (11B) | TPAUSE Rd (66),(11B) | UMONITOR Rv (F3),(11B) | UMWAIT Rd (F2),(11B) | CLRSSBSY Mq (F3)
diff --git a/tools/arch/x86/tools/gen-insn-attr-x86.awk b/tools/arch/x86/tools/gen-insn-attr-x86.awk
index a42015b305f4..d8a9dae42c3d 100644
--- a/tools/arch/x86/tools/gen-insn-attr-x86.awk
+++ b/tools/arch/x86/tools/gen-insn-attr-x86.awk
@@ -44,7 +44,7 @@ BEGIN {
        delete atable
 
        opnd_expr = "^[A-Za-z/]"
-       ext_expr = "^\\("
+       ext_expr = "^(\\(|\\{)"
        sep_expr = "^\\|$"
        group_expr = "^Grp[0-9A-Za-z]+"
 
@@ -65,7 +65,10 @@ BEGIN {
        modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
        force64_expr = "\\([df]64\\)"
        rex_expr = "^REX(\\.[XRWB]+)*"
-       fpu_expr = "^ESC" # TODO
+       x87_expr = "^ESC"
+
+       fpureg_expr = "^[HLNPQUVW][a-z]+" # MMX/SSE register operands
+       fpu_expr = "\\{FPU\\}"
 
        lprefix1_expr = "\\((66|!F3)\\)"
        lprefix2_expr = "\\(F3\\)"
@@ -236,10 +239,11 @@ function add_flags(old,new) {
 }
 
 # convert operands to flags.
-function convert_operands(count,opnd,       i,j,imm,mod)
+function convert_operands(count,opnd,       i,j,imm,mod,fpu)
 {
        imm = null
        mod = null
+       fpu = null
        for (j = 1; j <= count; j++) {
                i = opnd[j]
                if (match(i, imm_expr) == 1) {
@@ -253,7 +257,12 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                                imm = imm_flag[i]
                } else if (match(i, modrm_expr))
                        mod = "INAT_MODRM"
+               if (match(i, fpureg_expr) == 1) {
+                       fpu = "INAT_FPU"
+               }
        }
+       if (fpu)
+               imm = add_flags(imm, fpu)
        return add_flags(imm, mod)
 }
 
@@ -283,6 +292,10 @@ function convert_operands(count,opnd,       i,j,imm,mod)
        variant = null
        # converts
        i = 2
+       lpfpu[0] = 0
+       lpfpu[1] = 0
+       lpfpu[2] = 0
+       lpfpu[3] = 0
        while (i <= NF) {
                opcode = $(i++)
                delete opnds
@@ -318,10 +331,14 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                if (match(opcode, rex_expr))
                        flags = add_flags(flags, "INAT_MAKE_PREFIX(INAT_PFX_REX)")
 
-               # check coprocessor escape : TODO
-               if (match(opcode, fpu_expr))
+               # x87 escape opcode needs MODRM
+               if (match(ext, x87_expr))
                        flags = add_flags(flags, "INAT_MODRM")
 
+               # check FPU/MMX/SSE superscripts
+               if (match(ext, fpu_expr))
+                       flags = add_flags(flags, "INAT_FPU")
+
                # check VEX codes
                if (match(ext, evexonly_expr))
                        flags = add_flags(flags, "INAT_VEXOK | INAT_EVEXONLY")
@@ -336,22 +353,49 @@ function convert_operands(count,opnd,       i,j,imm,mod)
                                semantic_error("Unknown prefix: " opcode)
                        flags = add_flags(flags, "INAT_MAKE_PREFIX(" prefix_num[opcode] ")")
                }
-               if (length(flags) == 0)
-                       continue
+
                # check if last prefix
                if (match(ext, lprefix1_expr)) {
+                       if (lpfpu[1] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[1] = 1
+                       else if (lpfpu[1] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable1[idx] = add_flags(lptable1[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (match(ext, lprefix2_expr)) {
+                       if (lpfpu[2] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[2] = 1
+                       else if (lpfpu[2] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable2[idx] = add_flags(lptable2[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (match(ext, lprefix3_expr)) {
+                       if (lpfpu[3] == 0 && flags !~ "INAT_FPU")
+                               lpfpu[3] = 1
+                       else if (lpfpu[3] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        lptable3[idx] = add_flags(lptable3[idx],flags)
                        variant = "INAT_VARIANT"
                }
                if (!match(ext, lprefix_expr)){
+                       if (lpfpu[0] == 0 && flags !~ "INAT_FPU") {
+                               lpfpu[0] = 1
+                               lpfpu[1] = 1
+                               lpfpu[2] = 1
+                               lpfpu[3] = 1
+                       }
+                       else if (lpfpu[0] != 0 && flags ~ "INAT_FPU")
+                               flags = add_flags(flags, "INAT_FPUIFVEX")
+                       if (length(flags) == 0)
+                               continue;
                        table[idx] = add_flags(table[idx],flags)
                }
        }

_______________________________________________
amd-gfx mailing list
amd-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/amd-gfx

Reply via email to