x86: Don't use dl_x86_cpu_features in cacheinfo.c

Message ID 20170524200941.GA30586@lucon.org
State New, archived
Headers

Commit Message

Lu, Hongjiu May 24, 2017, 8:09 p.m. UTC
  Since cpu_features is available, use it instead of dl_x86_cpu_features.

Any comments?

H.J.
---
	* sysdeps/x86/cacheinfo.c (intel_check_word): Accept cpu_features
	and use it instead of dl_x86_cpu_features.
	(handle_intel): Replace maxidx with cpu_features.  Pass
	cpu_features to intel_check_word.
	(__cache_sysconf): Pass cpu_features to handle_intel.
	(init_cacheinfo): Likewise.  Use cpu_features instead of
	dl_x86_cpu_features.
---
 sysdeps/x86/cacheinfo.c | 37 ++++++++++++++++++++++---------------
 1 file changed, 22 insertions(+), 15 deletions(-)
  

Comments

H.J. Lu May 31, 2017, 7:48 p.m. UTC | #1
On Wed, May 24, 2017 at 1:09 PM, H.J. Lu <hongjiu.lu@intel.com> wrote:
> Since cpu_features is available, use it instead of dl_x86_cpu_features.
>
> Any comments?

Any objections?

> H.J.
> ---
>         * sysdeps/x86/cacheinfo.c (intel_check_word): Accept cpu_features
>         and use it instead of dl_x86_cpu_features.
>         (handle_intel): Replace maxidx with cpu_features.  Pass
>         cpu_features to intel_check_word.
>         (__cache_sysconf): Pass cpu_features to handle_intel.
>         (init_cacheinfo): Likewise.  Use cpu_features instead of
>         dl_x86_cpu_features.
> ---
>  sysdeps/x86/cacheinfo.c | 37 ++++++++++++++++++++++---------------
>  1 file changed, 22 insertions(+), 15 deletions(-)
>
> diff --git a/sysdeps/x86/cacheinfo.c b/sysdeps/x86/cacheinfo.c
> index 321fbb6..a46dd4d 100644
> --- a/sysdeps/x86/cacheinfo.c
> +++ b/sysdeps/x86/cacheinfo.c
> @@ -126,7 +126,8 @@ intel_02_known_compare (const void *p1, const void *p2)
>  static long int
>  __attribute__ ((noinline))
>  intel_check_word (int name, unsigned int value, bool *has_level_2,
> -                 bool *no_level_2_or_3)
> +                 bool *no_level_2_or_3,
> +                 const struct cpu_features *cpu_features)
>  {
>    if ((value & 0x80000000) != 0)
>      /* The register value is reserved.  */
> @@ -204,8 +205,8 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>               /* Intel reused this value.  For family 15, model 6 it
>                  specifies the 3rd level cache.  Otherwise the 2nd
>                  level cache.  */
> -             unsigned int family = GLRO(dl_x86_cpu_features).family;
> -             unsigned int model = GLRO(dl_x86_cpu_features).model;
> +             unsigned int family = cpu_features->family;
> +             unsigned int model = cpu_features->model;
>
>               if (family == 15 && model == 6)
>                 {
> @@ -255,8 +256,10 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>
>
>  static long int __attribute__ ((noinline))
> -handle_intel (int name, unsigned int maxidx)
> +handle_intel (int name, const struct cpu_features *cpu_features)
>  {
> +  unsigned int maxidx = cpu_features->max_cpuid;
> +
>    /* Return -1 for older CPUs.  */
>    if (maxidx < 2)
>      return -1;
> @@ -287,19 +290,23 @@ handle_intel (int name, unsigned int maxidx)
>         }
>
>        /* Process the individual registers' value.  */
> -      result = intel_check_word (name, eax, &has_level_2, &no_level_2_or_3);
> +      result = intel_check_word (name, eax, &has_level_2,
> +                                &no_level_2_or_3, cpu_features);
>        if (result != 0)
>         return result;
>
> -      result = intel_check_word (name, ebx, &has_level_2, &no_level_2_or_3);
> +      result = intel_check_word (name, ebx, &has_level_2,
> +                                &no_level_2_or_3, cpu_features);
>        if (result != 0)
>         return result;
>
> -      result = intel_check_word (name, ecx, &has_level_2, &no_level_2_or_3);
> +      result = intel_check_word (name, ecx, &has_level_2,
> +                                &no_level_2_or_3, cpu_features);
>        if (result != 0)
>         return result;
>
> -      result = intel_check_word (name, edx, &has_level_2, &no_level_2_or_3);
> +      result = intel_check_word (name, edx, &has_level_2,
> +                                &no_level_2_or_3, cpu_features);
>        if (result != 0)
>         return result;
>      }
> @@ -437,7 +444,7 @@ __cache_sysconf (int name)
>    const struct cpu_features *cpu_features = __get_cpu_features ();
>
>    if (cpu_features->kind == arch_kind_intel)
> -    return handle_intel (name, cpu_features->max_cpuid);
> +    return handle_intel (name, cpu_features);
>
>    if (cpu_features->kind == arch_kind_amd)
>      return handle_amd (name);
> @@ -494,14 +501,14 @@ init_cacheinfo (void)
>
>    if (cpu_features->kind == arch_kind_intel)
>      {
> -      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, max_cpuid);
> +      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, cpu_features);
>
> -      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, max_cpuid);
> +      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, cpu_features);
>        bool inclusive_cache = true;
>
>        /* Try L3 first.  */
>        level  = 3;
> -      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, max_cpuid);
> +      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, cpu_features);
>
>        /* Number of logical processors sharing L2 cache.  */
>        int threads_l2;
> @@ -531,8 +538,8 @@ init_cacheinfo (void)
>              highest cache level.  */
>           if (max_cpuid >= 4)
>             {
> -             unsigned int family = GLRO(dl_x86_cpu_features).family;
> -             unsigned int model = GLRO(dl_x86_cpu_features).model;
> +             unsigned int family = cpu_features->family;
> +             unsigned int model = cpu_features->model;
>
>               int i = 0;
>
> @@ -675,7 +682,7 @@ intel_bug_no_cache_info:
>                  level.  */
>
>               threads
> -               = ((GLRO(dl_x86_cpu_features).cpuid[COMMON_CPUID_INDEX_1].ebx
> +               = ((cpu_features->cpuid[COMMON_CPUID_INDEX_1].ebx
>                     >> 16) & 0xff);
>             }
>
> --
> 2.9.4
>
  
H.J. Lu June 5, 2017, 11:19 p.m. UTC | #2
On Wed, May 31, 2017 at 12:48 PM, H.J. Lu <hjl.tools@gmail.com> wrote:
> On Wed, May 24, 2017 at 1:09 PM, H.J. Lu <hongjiu.lu@intel.com> wrote:
>> Since cpu_features is available, use it instead of dl_x86_cpu_features.
>>
>> Any comments?
>
> Any objections?

I am checking it in now.

>> H.J.
>> ---
>>         * sysdeps/x86/cacheinfo.c (intel_check_word): Accept cpu_features
>>         and use it instead of dl_x86_cpu_features.
>>         (handle_intel): Replace maxidx with cpu_features.  Pass
>>         cpu_features to intel_check_word.
>>         (__cache_sysconf): Pass cpu_features to handle_intel.
>>         (init_cacheinfo): Likewise.  Use cpu_features instead of
>>         dl_x86_cpu_features.
>> ---
>>  sysdeps/x86/cacheinfo.c | 37 ++++++++++++++++++++++---------------
>>  1 file changed, 22 insertions(+), 15 deletions(-)
>>
>> diff --git a/sysdeps/x86/cacheinfo.c b/sysdeps/x86/cacheinfo.c
>> index 321fbb6..a46dd4d 100644
>> --- a/sysdeps/x86/cacheinfo.c
>> +++ b/sysdeps/x86/cacheinfo.c
>> @@ -126,7 +126,8 @@ intel_02_known_compare (const void *p1, const void *p2)
>>  static long int
>>  __attribute__ ((noinline))
>>  intel_check_word (int name, unsigned int value, bool *has_level_2,
>> -                 bool *no_level_2_or_3)
>> +                 bool *no_level_2_or_3,
>> +                 const struct cpu_features *cpu_features)
>>  {
>>    if ((value & 0x80000000) != 0)
>>      /* The register value is reserved.  */
>> @@ -204,8 +205,8 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>>               /* Intel reused this value.  For family 15, model 6 it
>>                  specifies the 3rd level cache.  Otherwise the 2nd
>>                  level cache.  */
>> -             unsigned int family = GLRO(dl_x86_cpu_features).family;
>> -             unsigned int model = GLRO(dl_x86_cpu_features).model;
>> +             unsigned int family = cpu_features->family;
>> +             unsigned int model = cpu_features->model;
>>
>>               if (family == 15 && model == 6)
>>                 {
>> @@ -255,8 +256,10 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>>
>>
>>  static long int __attribute__ ((noinline))
>> -handle_intel (int name, unsigned int maxidx)
>> +handle_intel (int name, const struct cpu_features *cpu_features)
>>  {
>> +  unsigned int maxidx = cpu_features->max_cpuid;
>> +
>>    /* Return -1 for older CPUs.  */
>>    if (maxidx < 2)
>>      return -1;
>> @@ -287,19 +290,23 @@ handle_intel (int name, unsigned int maxidx)
>>         }
>>
>>        /* Process the individual registers' value.  */
>> -      result = intel_check_word (name, eax, &has_level_2, &no_level_2_or_3);
>> +      result = intel_check_word (name, eax, &has_level_2,
>> +                                &no_level_2_or_3, cpu_features);
>>        if (result != 0)
>>         return result;
>>
>> -      result = intel_check_word (name, ebx, &has_level_2, &no_level_2_or_3);
>> +      result = intel_check_word (name, ebx, &has_level_2,
>> +                                &no_level_2_or_3, cpu_features);
>>        if (result != 0)
>>         return result;
>>
>> -      result = intel_check_word (name, ecx, &has_level_2, &no_level_2_or_3);
>> +      result = intel_check_word (name, ecx, &has_level_2,
>> +                                &no_level_2_or_3, cpu_features);
>>        if (result != 0)
>>         return result;
>>
>> -      result = intel_check_word (name, edx, &has_level_2, &no_level_2_or_3);
>> +      result = intel_check_word (name, edx, &has_level_2,
>> +                                &no_level_2_or_3, cpu_features);
>>        if (result != 0)
>>         return result;
>>      }
>> @@ -437,7 +444,7 @@ __cache_sysconf (int name)
>>    const struct cpu_features *cpu_features = __get_cpu_features ();
>>
>>    if (cpu_features->kind == arch_kind_intel)
>> -    return handle_intel (name, cpu_features->max_cpuid);
>> +    return handle_intel (name, cpu_features);
>>
>>    if (cpu_features->kind == arch_kind_amd)
>>      return handle_amd (name);
>> @@ -494,14 +501,14 @@ init_cacheinfo (void)
>>
>>    if (cpu_features->kind == arch_kind_intel)
>>      {
>> -      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, max_cpuid);
>> +      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, cpu_features);
>>
>> -      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, max_cpuid);
>> +      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, cpu_features);
>>        bool inclusive_cache = true;
>>
>>        /* Try L3 first.  */
>>        level  = 3;
>> -      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, max_cpuid);
>> +      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, cpu_features);
>>
>>        /* Number of logical processors sharing L2 cache.  */
>>        int threads_l2;
>> @@ -531,8 +538,8 @@ init_cacheinfo (void)
>>              highest cache level.  */
>>           if (max_cpuid >= 4)
>>             {
>> -             unsigned int family = GLRO(dl_x86_cpu_features).family;
>> -             unsigned int model = GLRO(dl_x86_cpu_features).model;
>> +             unsigned int family = cpu_features->family;
>> +             unsigned int model = cpu_features->model;
>>
>>               int i = 0;
>>
>> @@ -675,7 +682,7 @@ intel_bug_no_cache_info:
>>                  level.  */
>>
>>               threads
>> -               = ((GLRO(dl_x86_cpu_features).cpuid[COMMON_CPUID_INDEX_1].ebx
>> +               = ((cpu_features->cpuid[COMMON_CPUID_INDEX_1].ebx
>>                     >> 16) & 0xff);
>>             }
>>
>> --
>> 2.9.4
>>
>
>
>
> --
> H.J.
  

Patch

diff --git a/sysdeps/x86/cacheinfo.c b/sysdeps/x86/cacheinfo.c
index 321fbb6..a46dd4d 100644
--- a/sysdeps/x86/cacheinfo.c
+++ b/sysdeps/x86/cacheinfo.c
@@ -126,7 +126,8 @@  intel_02_known_compare (const void *p1, const void *p2)
 static long int
 __attribute__ ((noinline))
 intel_check_word (int name, unsigned int value, bool *has_level_2,
-		  bool *no_level_2_or_3)
+		  bool *no_level_2_or_3,
+		  const struct cpu_features *cpu_features)
 {
   if ((value & 0x80000000) != 0)
     /* The register value is reserved.  */
@@ -204,8 +205,8 @@  intel_check_word (int name, unsigned int value, bool *has_level_2,
 	      /* Intel reused this value.  For family 15, model 6 it
 		 specifies the 3rd level cache.  Otherwise the 2nd
 		 level cache.  */
-	      unsigned int family = GLRO(dl_x86_cpu_features).family;
-	      unsigned int model = GLRO(dl_x86_cpu_features).model;
+	      unsigned int family = cpu_features->family;
+	      unsigned int model = cpu_features->model;
 
 	      if (family == 15 && model == 6)
 		{
@@ -255,8 +256,10 @@  intel_check_word (int name, unsigned int value, bool *has_level_2,
 
 
 static long int __attribute__ ((noinline))
-handle_intel (int name, unsigned int maxidx)
+handle_intel (int name, const struct cpu_features *cpu_features)
 {
+  unsigned int maxidx = cpu_features->max_cpuid;
+
   /* Return -1 for older CPUs.  */
   if (maxidx < 2)
     return -1;
@@ -287,19 +290,23 @@  handle_intel (int name, unsigned int maxidx)
 	}
 
       /* Process the individual registers' value.  */
-      result = intel_check_word (name, eax, &has_level_2, &no_level_2_or_3);
+      result = intel_check_word (name, eax, &has_level_2,
+				 &no_level_2_or_3, cpu_features);
       if (result != 0)
 	return result;
 
-      result = intel_check_word (name, ebx, &has_level_2, &no_level_2_or_3);
+      result = intel_check_word (name, ebx, &has_level_2,
+				 &no_level_2_or_3, cpu_features);
       if (result != 0)
 	return result;
 
-      result = intel_check_word (name, ecx, &has_level_2, &no_level_2_or_3);
+      result = intel_check_word (name, ecx, &has_level_2,
+				 &no_level_2_or_3, cpu_features);
       if (result != 0)
 	return result;
 
-      result = intel_check_word (name, edx, &has_level_2, &no_level_2_or_3);
+      result = intel_check_word (name, edx, &has_level_2,
+				 &no_level_2_or_3, cpu_features);
       if (result != 0)
 	return result;
     }
@@ -437,7 +444,7 @@  __cache_sysconf (int name)
   const struct cpu_features *cpu_features = __get_cpu_features ();
 
   if (cpu_features->kind == arch_kind_intel)
-    return handle_intel (name, cpu_features->max_cpuid);
+    return handle_intel (name, cpu_features);
 
   if (cpu_features->kind == arch_kind_amd)
     return handle_amd (name);
@@ -494,14 +501,14 @@  init_cacheinfo (void)
 
   if (cpu_features->kind == arch_kind_intel)
     {
-      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, max_cpuid);
+      data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, cpu_features);
 
-      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, max_cpuid);
+      long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, cpu_features);
       bool inclusive_cache = true;
 
       /* Try L3 first.  */
       level  = 3;
-      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, max_cpuid);
+      shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, cpu_features);
 
       /* Number of logical processors sharing L2 cache.  */
       int threads_l2;
@@ -531,8 +538,8 @@  init_cacheinfo (void)
 	     highest cache level.  */
 	  if (max_cpuid >= 4)
 	    {
-	      unsigned int family = GLRO(dl_x86_cpu_features).family;
-	      unsigned int model = GLRO(dl_x86_cpu_features).model;
+	      unsigned int family = cpu_features->family;
+	      unsigned int model = cpu_features->model;
 
 	      int i = 0;
 
@@ -675,7 +682,7 @@  intel_bug_no_cache_info:
 		 level.  */
 
 	      threads
-		= ((GLRO(dl_x86_cpu_features).cpuid[COMMON_CPUID_INDEX_1].ebx
+		= ((cpu_features->cpuid[COMMON_CPUID_INDEX_1].ebx
 		    >> 16) & 0xff);
 	    }