[PATCH, i386] Add missing entries to cpuinfo.
Uros Bizjak
ubizjak@gmail.com
Tue Oct 6 15:15:00 GMT 2015
On Tue, Oct 6, 2015 at 3:36 PM, Kirill Yukhin <kirill.yukhin@gmail.com> wrote:
> Hello,
> Patch in the bottom adds missing options to libgcc/config/i386/cpuinfo.c
> It also updates documentation.
> As far as number of entries exceeded 32, I've extended
> type of features array to INT64 (most suspicious part of the patch).
>
> Bootstrapped and regtested. `make pdf' seems to be working properly.
>
> Comments?
Er, this is on purpose. Multiversioning is intended to depend on ISA
extensions such as SSE, AVX, AES to some degree, and similar
extensions that do make a difference when used in compilation. This
was discussed some years ago, but I can't find the URL of the
discussion.
So, from the list below, I'd take only SHA. Plus fixes/additions in
the documentation and testsuite, of course.
Uros.
> gcc/
> * config/i386/i386.c (build_processor_model_struct): Replace
> array type to intDI.
> (old_builtin_cpu): Handle SHA, PREFETCHWT1, FSGSBASE, HLE,
> RTM, RDSEED, ADX, MPX, CLFLUSHOPT, PCOMMIT, CLWB, XSAVEOPT,
> XSAVEC, and XSAVES features. Update built-in expansion.
> * doc/extend.texi (ivybridge): New.
> (haswell): Ditto.
> (broadwell): Ditto.
> (skylake): Ditto.
> (skylake-avx512): Ditto.
> (aes): Ditto.
> (pclmul): Ditto.
> (fma): Ditto.
> (bmi): Ditto.
> (bmi2): Ditto.
> (avx512bw): Ditto.
> (avx512dq): Ditto.
> (avx512pf): Ditto.
> (avx512er): Ditto.
> (avx512ifma): Ditto.
> (avx512vbmi): Ditto.
> (sha): Ditto.
> (prefetchwt1): Ditto.
>
> gcc/testsuite/
> * gcc.target/i386/builtin_target.c: Check SHA, PREFETCHWT1,
> FSGSBASE, HLE, RTM, RDSEED, ADX, MPX, CLFLUSHOPT, PCOMMIT,
> CLWB, XSAVEOPT, XSAVEC, and XSAVES features.
>
> libgcc/
> * config/i386/cpuinfo.c (processor_features): Add SHA, PREFETCHWT1,
> FSGSBASE, HLE, RTM, RDSEED, ADX, MPX, CLFLUSHOPT, PCOMMIT, CLWB,
> XSAVEOPT, XSAVEC, and XSAVES features.
> (struct __processor_model): Set type of __cpu_features array to
> uint64_t.
> (get_available_features): Add new features. Reorder according
> to bit number.
>
> --
> Thanks, K
>
> commit 839916b8d017fac166f76c317bdf5c38d5d15ea4
> Author: Kirill Yukhin <kirill.yukhin@intel.com>
> Date: Tue Oct 6 16:20:09 2015 +0300
>
> Add missing entries to libgcc/config/i386/cpuinfo.c.
>
> diff --git a/gcc/config/i386/i386.c b/gcc/config/i386/i386.c
> index d59b59b..13241f2 100644
> --- a/gcc/config/i386/i386.c
> +++ b/gcc/config/i386/i386.c
> @@ -36507,10 +36507,10 @@ build_processor_model_struct (void)
> field_chain = field;
> }
>
> - /* The last field is an array of unsigned integers of size one. */
> + /* The last field is an array of unsigned long long integers of size one. */
> field = build_decl (UNKNOWN_LOCATION, FIELD_DECL,
> get_identifier (field_name[3]),
> - build_array_type (unsigned_type_node,
> + build_array_type (unsigned_intDI_type_node,
> build_index_type (size_one_node)));
> if (field_chain != NULL_TREE)
> DECL_CHAIN (field) = field_chain;
> @@ -36587,6 +36587,20 @@ fold_builtin_cpu (tree fndecl, tree *args)
> F_AVX512PF,
> F_AVX512VBMI,
> F_AVX512IFMA,
> + F_SHA,
> + F_PREFETCHWT1,
> + F_FSGSBASE,
> + F_HLE,
> + F_RTM,
> + F_RDSEED,
> + F_ADX,
> + F_MPX,
> + F_CLFLUSHOPT,
> + F_PCOMMIT,
> + F_CLWB,
> + F_XSAVEOPT,
> + F_XSAVEC,
> + F_XSAVES,
> F_MAX
> };
>
> @@ -36697,6 +36711,20 @@ fold_builtin_cpu (tree fndecl, tree *args)
> {"avx512pf",F_AVX512PF},
> {"avx512vbmi",F_AVX512VBMI},
> {"avx512ifma",F_AVX512IFMA},
> + {"prefetchwt1", F_PREFETCHWT1},
> + {"sha", F_SHA},
> + {"fsgsbase",F_FSGSBASE},
> + {"hle", F_HLE},
> + {"rtm", F_RTM},
> + {"rdseed", F_RDSEED},
> + {"adx", F_ADX},
> + {"mpx", F_MPX},
> + {"clflushopt",F_CLFLUSHOPT},
> + {"pcommit", F_PCOMMIT},
> + {"clwb", F_CLWB},
> + {"xsaveopt",F_XSAVEOPT},
> + {"xsavec", F_XSAVEC},
> + {"xsaves", F_XSAVES},
> };
>
> tree __processor_model_type = build_processor_model_struct ();
> @@ -36780,7 +36808,7 @@ fold_builtin_cpu (tree fndecl, tree *args)
> tree field;
> tree final;
>
> - unsigned int field_val = 0;
> + unsigned HOST_WIDE_INT field_val = 0;
> unsigned int NUM_ISA_NAMES
> = sizeof (isa_names_table) / sizeof (struct _isa_names_table);
>
> @@ -36806,13 +36834,13 @@ fold_builtin_cpu (tree fndecl, tree *args)
> field, NULL_TREE);
>
> /* Access the 0th element of __cpu_features array. */
> - array_elt = build4 (ARRAY_REF, unsigned_type_node, ref,
> + array_elt = build4 (ARRAY_REF, unsigned_intDI_type_node, ref,
> integer_zero_node, NULL_TREE, NULL_TREE);
>
> field_val = (1 << isa_names_table[i].feature);
> /* Return __cpu_model.__cpu_features[0] & field_val */
> - final = build2 (BIT_AND_EXPR, unsigned_type_node, array_elt,
> - build_int_cstu (unsigned_type_node, field_val));
> + final = build2 (BIT_AND_EXPR, unsigned_intDI_type_node, array_elt,
> + build_int_cstu (unsigned_intDI_type_node, field_val));
> return build1 (CONVERT_EXPR, integer_type_node, final);
> }
> gcc_unreachable ();
> diff --git a/gcc/doc/extend.texi b/gcc/doc/extend.texi
> index 2db7bb2..72ccdad 100644
> --- a/gcc/doc/extend.texi
> +++ b/gcc/doc/extend.texi
> @@ -16894,6 +16894,21 @@ Intel Core i7 Westmere CPU.
> @item sandybridge
> Intel Core i7 Sandy Bridge CPU.
>
> +@item ivybridge
> +Intel Core i7 Ivy Bridge CPU.
> +
> +@item haswell
> +Intel Core i7 Haswell CPU.
> +
> +@item broadwell
> +Intel Core i7 Broadwell CPU.
> +
> +@item skylake
> +Intel Core i7 Skylake CPU.
> +
> +@item skylake-avx512
> +Intel Core i7 Skylake CPU with AVX-512 extensions.
> +
> @item amd
> AMD CPU.
>
> @@ -16968,12 +16983,40 @@ SSSE3 instructions.
> SSE4.1 instructions.
> @item sse4.2
> SSE4.2 instructions.
> +@item aes
> +AES instructions.
> +@item pclmul
> +PCLMUL instructions.
> @item avx
> AVX instructions.
> +@item fma
> +FMA instructions.
> @item avx2
> AVX2 instructions.
> +@item bmi
> +BMI instructions.
> +@item bmi2
> +BMI2 instructions.
> @item avx512f
> AVX512F instructions.
> +@item avx512bw
> +AVX512BW instructions.
> +@item avx512dq
> +AVX512DQ instructions.
> +@item avx512cd
> +AVX512CD instructions.
> +@item avx512pf
> +AVX512PF instructions.
> +@item avx512er
> +AVX512ER instructions.
> +@item avx512ifma
> +AVX512IFMA instructions.
> +@item avx512vbmi
> +AVX512VBMI instructions.
> +@item sha
> +SHA instructions.
> +@item prefetchwt1
> +PREFETCHWT1 instructions.
> @end table
>
> Here is an example:
> diff --git a/gcc/testsuite/gcc.target/i386/builtin_target.c b/gcc/testsuite/gcc.target/i386/builtin_target.c
> index dd31108..235c7b5 100644
> --- a/gcc/testsuite/gcc.target/i386/builtin_target.c
> +++ b/gcc/testsuite/gcc.target/i386/builtin_target.c
> @@ -173,10 +173,6 @@ check_features (unsigned int ecx, unsigned int edx,
> assert (__builtin_cpu_supports ("sse2"));
> if (ecx & bit_POPCNT)
> assert (__builtin_cpu_supports ("popcnt"));
> - if (ecx & bit_AES)
> - assert (__builtin_cpu_supports ("aes"));
> - if (ecx & bit_PCLMUL)
> - assert (__builtin_cpu_supports ("pclmul"));
> if (ecx & bit_SSE3)
> assert (__builtin_cpu_supports ("sse3"));
> if (ecx & bit_SSSE3)
> @@ -193,26 +189,61 @@ check_features (unsigned int ecx, unsigned int edx,
> {
> unsigned int eax, ebx, ecx, edx;
> __cpuid_count (7, 0, eax, ebx, ecx, edx);
> + if (ebx & bit_FSGSBASE)
> + assert (__builtin_cpu_supports ("fsgsbase"));
> + if (ebx & bit_BMI)
> + assert (__builtin_cpu_supports ("bmi"));
> + if (ebx & bit_HLE)
> + assert (__builtin_cpu_supports ("hle"));
> if (ebx & bit_AVX2)
> assert (__builtin_cpu_supports ("avx2"));
> + if (ebx & bit_BMI2)
> + assert (__builtin_cpu_supports ("bmi2"));
> + if (ebx & bit_RTM)
> + assert (__builtin_cpu_supports ("rtm"));
> + if (ebx & bit_MPX)
> + assert (__builtin_cpu_supports ("mpx"));
> if (ebx & bit_AVX512F)
> assert (__builtin_cpu_supports ("avx512f"));
> - if (ebx & bit_AVX512VL)
> - assert (__builtin_cpu_supports ("avx512vl"));
> - if (ebx & bit_AVX512CD)
> - assert (__builtin_cpu_supports ("avx512cd"));
> + if (ebx & bit_AVX512DQ)
> + assert (__builtin_cpu_supports ("avx512dq"));
> + if (ebx & bit_RDSEED)
> + assert (__builtin_cpu_supports ("rdseed"));
> + if (ebx & bit_ADX)
> + assert (__builtin_cpu_supports ("adx"));
> + if (ebx & bit_AVX512IFMA)
> + assert (__builtin_cpu_supports ("avx512ifma"));
> + if (ebx & bit_PCOMMIT)
> + assert (__builtin_cpu_supports ("pcommit"));
> + if (ebx & bit_CLFLUSHOPT)
> + assert (__builtin_cpu_supports ("clflushopt"));
> + if (ebx & bit_CLWB)
> + assert (__builtin_cpu_supports ("clwb"));
> if (ebx & bit_AVX512PF)
> assert (__builtin_cpu_supports ("avx512pf"));
> if (ebx & bit_AVX512ER)
> assert (__builtin_cpu_supports ("avx512er"));
> + if (ebx & bit_AVX512CD)
> + assert (__builtin_cpu_supports ("avx512cd"));
> + if (ebx & bit_SHA)
> + assert (__builtin_cpu_supports ("sha"));
> if (ebx & bit_AVX512BW)
> assert (__builtin_cpu_supports ("avx512bw"));
> - if (ebx & bit_AVX512DQ)
> - assert (__builtin_cpu_supports ("avx512dq"));
> - if (ebx & bit_AVX512IFMA)
> - assert (__builtin_cpu_supports ("avx512ifma"));
> + if (ebx & bit_AVX512VL)
> + assert (__builtin_cpu_supports ("avx512vl"));
> +
> if (ecx & bit_AVX512VBMI)
> assert (__builtin_cpu_supports ("avx512vbmi"));
> + if (ecx & bit_PREFETCHWT1)
> + assert (__builtin_cpu_supports ("prefetchwt1"));
> +
> + __cpuid_count (7, 1, eax, ebx, ecx, edx);
> + if (eax & bit_XSAVEOPT)
> + assert (__builtin_cpu_supports ("xsaveopt"));
> + if (eax & bit_XSAVEC)
> + assert (__builtin_cpu_supports ("xsavec"));
> + if (eax & bit_XSAVES)
> + assert (__builtin_cpu_supports ("xsaves"));
> }
> }
>
> diff --git a/libgcc/config/i386/cpuinfo.c b/libgcc/config/i386/cpuinfo.c
> index 0cbbc85..e928411 100644
> --- a/libgcc/config/i386/cpuinfo.c
> +++ b/libgcc/config/i386/cpuinfo.c
> @@ -23,6 +23,7 @@ a copy of the GCC Runtime Library Exception along with this program;
> see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
> <http://www.gnu.org/licenses/>. */
>
> +#include <stdint.h>
> #include "cpuid.h"
> #include "tsystem.h"
> #include "auto-target.h"
> @@ -113,7 +114,21 @@ enum processor_features
> FEATURE_AVX512ER,
> FEATURE_AVX512PF,
> FEATURE_AVX512VBMI,
> - FEATURE_AVX512IFMA
> + FEATURE_AVX512IFMA,
> + FEATURE_SHA,
> + FEATURE_PREFETCHWT1,
> + FEATURE_FSGSBASE, /* 31 */
> + FEATURE_HLE,
> + FEATURE_RTM,
> + FEATURE_RDSEED,
> + FEATURE_ADX,
> + FEATURE_MPX,
> + FEATURE_CLFLUSHOPT,
> + FEATURE_PCOMMIT,
> + FEATURE_CLWB,
> + FEATURE_XSAVEOPT,
> + FEATURE_XSAVEC,
> + FEATURE_XSAVES
> };
>
> struct __processor_model
> @@ -121,7 +136,7 @@ struct __processor_model
> unsigned int __cpu_vendor;
> unsigned int __cpu_type;
> unsigned int __cpu_subtype;
> - unsigned int __cpu_features[1];
> + uint64_t __cpu_features[1];
> } __cpu_model = { };
>
>
> @@ -290,64 +305,95 @@ static void
> get_available_features (unsigned int ecx, unsigned int edx,
> int max_cpuid_level)
> {
> - unsigned int features = 0;
> + uint64_t features = 0;
>
> if (edx & bit_CMOV)
> - features |= (1 << FEATURE_CMOV);
> + features |= (1ULL << FEATURE_CMOV);
> if (edx & bit_MMX)
> - features |= (1 << FEATURE_MMX);
> + features |= (1ULL << FEATURE_MMX);
> if (edx & bit_SSE)
> - features |= (1 << FEATURE_SSE);
> + features |= (1ULL << FEATURE_SSE);
> if (edx & bit_SSE2)
> - features |= (1 << FEATURE_SSE2);
> + features |= (1ULL << FEATURE_SSE2);
> if (ecx & bit_POPCNT)
> - features |= (1 << FEATURE_POPCNT);
> + features |= (1ULL << FEATURE_POPCNT);
> if (ecx & bit_AES)
> - features |= (1 << FEATURE_AES);
> + features |= (1ULL << FEATURE_AES);
> if (ecx & bit_PCLMUL)
> - features |= (1 << FEATURE_PCLMUL);
> + features |= (1ULL << FEATURE_PCLMUL);
> if (ecx & bit_SSE3)
> - features |= (1 << FEATURE_SSE3);
> + features |= (1ULL << FEATURE_SSE3);
> if (ecx & bit_SSSE3)
> - features |= (1 << FEATURE_SSSE3);
> + features |= (1ULL << FEATURE_SSSE3);
> if (ecx & bit_SSE4_1)
> - features |= (1 << FEATURE_SSE4_1);
> + features |= (1ULL << FEATURE_SSE4_1);
> if (ecx & bit_SSE4_2)
> - features |= (1 << FEATURE_SSE4_2);
> + features |= (1ULL << FEATURE_SSE4_2);
> if (ecx & bit_AVX)
> - features |= (1 << FEATURE_AVX);
> + features |= (1ULL << FEATURE_AVX);
> if (ecx & bit_FMA)
> - features |= (1 << FEATURE_FMA);
> + features |= (1ULL << FEATURE_FMA);
>
> /* Get Advanced Features at level 7 (eax = 7, ecx = 0). */
> if (max_cpuid_level >= 7)
> {
> unsigned int eax, ebx, ecx, edx;
> __cpuid_count (7, 0, eax, ebx, ecx, edx);
> + if (ebx & bit_FSGSBASE)
> + features |= (1ULL << FEATURE_FSGSBASE);
> if (ebx & bit_BMI)
> - features |= (1 << FEATURE_BMI);
> + features |= (1ULL << FEATURE_BMI);
> + if (ebx & bit_HLE)
> + features |= (1ULL << FEATURE_HLE);
> if (ebx & bit_AVX2)
> - features |= (1 << FEATURE_AVX2);
> + features |= (1ULL << FEATURE_AVX2);
> if (ebx & bit_BMI2)
> - features |= (1 << FEATURE_BMI2);
> + features |= (1ULL << FEATURE_BMI2);
> + if (ebx & bit_RTM)
> + features |= (1ULL << FEATURE_RTM);
> + if (ebx & bit_MPX)
> + features |= (1ULL << FEATURE_MPX);
> if (ebx & bit_AVX512F)
> - features |= (1 << FEATURE_AVX512F);
> - if (ebx & bit_AVX512VL)
> - features |= (1 << FEATURE_AVX512VL);
> - if (ebx & bit_AVX512BW)
> - features |= (1 << FEATURE_AVX512BW);
> + features |= (1ULL << FEATURE_AVX512F);
> if (ebx & bit_AVX512DQ)
> - features |= (1 << FEATURE_AVX512DQ);
> - if (ebx & bit_AVX512CD)
> - features |= (1 << FEATURE_AVX512CD);
> + features |= (1ULL << FEATURE_AVX512DQ);
> + if (ebx & bit_RDSEED)
> + features |= (1ULL << FEATURE_RDSEED);
> + if (ebx & bit_ADX)
> + features |= (1ULL << FEATURE_ADX);
> + if (ebx & bit_AVX512IFMA)
> + features |= (1ULL << FEATURE_AVX512IFMA);
> + if (ebx & bit_PCOMMIT)
> + features |= (1ULL << FEATURE_PCOMMIT);
> + if (ebx & bit_CLFLUSHOPT)
> + features |= (1ULL << FEATURE_CLFLUSHOPT);
> + if (ebx & bit_CLWB)
> + features |= (1ULL << FEATURE_CLWB);
> if (ebx & bit_AVX512PF)
> - features |= (1 << FEATURE_AVX512PF);
> + features |= (1ULL << FEATURE_AVX512PF);
> if (ebx & bit_AVX512ER)
> - features |= (1 << FEATURE_AVX512ER);
> - if (ebx & bit_AVX512IFMA)
> - features |= (1 << FEATURE_AVX512IFMA);
> + features |= (1ULL << FEATURE_AVX512ER);
> + if (ebx & bit_AVX512CD)
> + features |= (1ULL << FEATURE_AVX512CD);
> + if (ebx & bit_SHA)
> + features |= (1ULL << FEATURE_SHA);
> + if (ebx & bit_AVX512BW)
> + features |= (1ULL << FEATURE_AVX512BW);
> + if (ebx & bit_AVX512VL)
> + features |= (1ULL << FEATURE_AVX512VL);
> +
> if (ecx & bit_AVX512VBMI)
> - features |= (1 << FEATURE_AVX512VBMI);
> + features |= (1ULL << FEATURE_AVX512VBMI);
> + if (ecx & bit_PREFETCHWT1)
> + features |= (1ULL << FEATURE_PREFETCHWT1);
> +
> + __cpuid_count (7, 1, eax, ebx, ecx, edx);
> + if (eax & bit_XSAVEOPT)
> + features |= (1ULL << FEATURE_XSAVEOPT);
> + if (eax & bit_XSAVEC)
> + features |= (1ULL << FEATURE_XSAVEC);
> + if (eax & bit_XSAVES)
> + features |= (1ULL << FEATURE_XSAVES);
> }
>
> unsigned int ext_level;
> @@ -360,11 +406,11 @@ get_available_features (unsigned int ecx, unsigned int edx,
> __cpuid (0x80000001, eax, ebx, ecx, edx);
>
> if (ecx & bit_SSE4a)
> - features |= (1 << FEATURE_SSE4_A);
> + features |= (1ULL << FEATURE_SSE4_A);
> if (ecx & bit_FMA4)
> - features |= (1 << FEATURE_FMA4);
> + features |= (1ULL << FEATURE_FMA4);
> if (ecx & bit_XOP)
> - features |= (1 << FEATURE_XOP);
> + features |= (1ULL << FEATURE_XOP);
> }
>
> __cpu_model.__cpu_features[0] = features;
More information about the Gcc-patches
mailing list