This is the mail archive of the
libc-alpha@sourceware.org
mailing list for the glibc project.
Re: [PATCH] x86: Don't use dl_x86_cpu_features in cacheinfo.c
- From: "H.J. Lu" <hjl dot tools at gmail dot com>
- To: GNU C Library <libc-alpha at sourceware dot org>
- Date: Mon, 5 Jun 2017 16:19:08 -0700
- Subject: Re: [PATCH] x86: Don't use dl_x86_cpu_features in cacheinfo.c
- Authentication-results: sourceware.org; auth=none
- References: <20170524200941.GA30586@lucon.org> <CAMe9rOrvSC3bPU9bCygcXB7KF4sxu3T8SXdkYkZgD-6Vtu+fhA@mail.gmail.com>
On Wed, May 31, 2017 at 12:48 PM, H.J. Lu <hjl.tools@gmail.com> wrote:
> On Wed, May 24, 2017 at 1:09 PM, H.J. Lu <hongjiu.lu@intel.com> wrote:
>> Since cpu_features is available, use it instead of dl_x86_cpu_features.
>>
>> Any comments?
>
> Any objections?
I am checking it in now.
>> H.J.
>> ---
>> * sysdeps/x86/cacheinfo.c (intel_check_word): Accept cpu_features
>> and use it instead of dl_x86_cpu_features.
>> (handle_intel): Replace maxidx with cpu_features. Pass
>> cpu_features to intel_check_word.
>> (__cache_sysconf): Pass cpu_features to handle_intel.
>> (init_cacheinfo): Likewise. Use cpu_features instead of
>> dl_x86_cpu_features.
>> ---
>> sysdeps/x86/cacheinfo.c | 37 ++++++++++++++++++++++---------------
>> 1 file changed, 22 insertions(+), 15 deletions(-)
>>
>> diff --git a/sysdeps/x86/cacheinfo.c b/sysdeps/x86/cacheinfo.c
>> index 321fbb6..a46dd4d 100644
>> --- a/sysdeps/x86/cacheinfo.c
>> +++ b/sysdeps/x86/cacheinfo.c
>> @@ -126,7 +126,8 @@ intel_02_known_compare (const void *p1, const void *p2)
>> static long int
>> __attribute__ ((noinline))
>> intel_check_word (int name, unsigned int value, bool *has_level_2,
>> - bool *no_level_2_or_3)
>> + bool *no_level_2_or_3,
>> + const struct cpu_features *cpu_features)
>> {
>> if ((value & 0x80000000) != 0)
>> /* The register value is reserved. */
>> @@ -204,8 +205,8 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>> /* Intel reused this value. For family 15, model 6 it
>> specifies the 3rd level cache. Otherwise the 2nd
>> level cache. */
>> - unsigned int family = GLRO(dl_x86_cpu_features).family;
>> - unsigned int model = GLRO(dl_x86_cpu_features).model;
>> + unsigned int family = cpu_features->family;
>> + unsigned int model = cpu_features->model;
>>
>> if (family == 15 && model == 6)
>> {
>> @@ -255,8 +256,10 @@ intel_check_word (int name, unsigned int value, bool *has_level_2,
>>
>>
>> static long int __attribute__ ((noinline))
>> -handle_intel (int name, unsigned int maxidx)
>> +handle_intel (int name, const struct cpu_features *cpu_features)
>> {
>> + unsigned int maxidx = cpu_features->max_cpuid;
>> +
>> /* Return -1 for older CPUs. */
>> if (maxidx < 2)
>> return -1;
>> @@ -287,19 +290,23 @@ handle_intel (int name, unsigned int maxidx)
>> }
>>
>> /* Process the individual registers' value. */
>> - result = intel_check_word (name, eax, &has_level_2, &no_level_2_or_3);
>> + result = intel_check_word (name, eax, &has_level_2,
>> + &no_level_2_or_3, cpu_features);
>> if (result != 0)
>> return result;
>>
>> - result = intel_check_word (name, ebx, &has_level_2, &no_level_2_or_3);
>> + result = intel_check_word (name, ebx, &has_level_2,
>> + &no_level_2_or_3, cpu_features);
>> if (result != 0)
>> return result;
>>
>> - result = intel_check_word (name, ecx, &has_level_2, &no_level_2_or_3);
>> + result = intel_check_word (name, ecx, &has_level_2,
>> + &no_level_2_or_3, cpu_features);
>> if (result != 0)
>> return result;
>>
>> - result = intel_check_word (name, edx, &has_level_2, &no_level_2_or_3);
>> + result = intel_check_word (name, edx, &has_level_2,
>> + &no_level_2_or_3, cpu_features);
>> if (result != 0)
>> return result;
>> }
>> @@ -437,7 +444,7 @@ __cache_sysconf (int name)
>> const struct cpu_features *cpu_features = __get_cpu_features ();
>>
>> if (cpu_features->kind == arch_kind_intel)
>> - return handle_intel (name, cpu_features->max_cpuid);
>> + return handle_intel (name, cpu_features);
>>
>> if (cpu_features->kind == arch_kind_amd)
>> return handle_amd (name);
>> @@ -494,14 +501,14 @@ init_cacheinfo (void)
>>
>> if (cpu_features->kind == arch_kind_intel)
>> {
>> - data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, max_cpuid);
>> + data = handle_intel (_SC_LEVEL1_DCACHE_SIZE, cpu_features);
>>
>> - long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, max_cpuid);
>> + long int core = handle_intel (_SC_LEVEL2_CACHE_SIZE, cpu_features);
>> bool inclusive_cache = true;
>>
>> /* Try L3 first. */
>> level = 3;
>> - shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, max_cpuid);
>> + shared = handle_intel (_SC_LEVEL3_CACHE_SIZE, cpu_features);
>>
>> /* Number of logical processors sharing L2 cache. */
>> int threads_l2;
>> @@ -531,8 +538,8 @@ init_cacheinfo (void)
>> highest cache level. */
>> if (max_cpuid >= 4)
>> {
>> - unsigned int family = GLRO(dl_x86_cpu_features).family;
>> - unsigned int model = GLRO(dl_x86_cpu_features).model;
>> + unsigned int family = cpu_features->family;
>> + unsigned int model = cpu_features->model;
>>
>> int i = 0;
>>
>> @@ -675,7 +682,7 @@ intel_bug_no_cache_info:
>> level. */
>>
>> threads
>> - = ((GLRO(dl_x86_cpu_features).cpuid[COMMON_CPUID_INDEX_1].ebx
>> + = ((cpu_features->cpuid[COMMON_CPUID_INDEX_1].ebx
>> >> 16) & 0xff);
>> }
>>
>> --
>> 2.9.4
>>
>
>
>
> --
> H.J.
--
H.J.