V2 [PATCH 1/2] Update tunable min/max values

From: "H.J. Lu" <hjl.tools@gmail.com>

  On Fri, Jul 03, 2020 at 03:49:16PM -0400, Carlos O'Donell wrote:
> On 7/3/20 1:52 PM, H.J. Lu wrote:
> > Add __tunable_update_val to update tunable min/max values and move x86
> > processor cache info to cpu_features.
> 
> Needs a little more cleanup. I'd like to avoid more macro APIs if possible.
> 
> Post v2 please.
> 
> > ---
> >  elf/dl-tunables.c          |  51 ++-
> >  elf/dl-tunables.h          |  15 +
> >  sysdeps/i386/cacheinfo.c   |   3 -
> >  sysdeps/x86/Makefile       |   2 +-
> >  sysdeps/x86/cacheinfo.c    | 852 +++--------------------------------
> >  sysdeps/x86/cpu-features.c |  19 +-
> >  sysdeps/x86/cpu-features.h |  26 ++
> >  sysdeps/x86/dl-cacheinfo.c | 888 +++++++++++++++++++++++++++++++++++++
> >  sysdeps/x86/init-arch.h    |   3 +
> >  9 files changed, 1024 insertions(+), 835 deletions(-)
> >  delete mode 100644 sysdeps/i386/cacheinfo.c
> >  create mode 100644 sysdeps/x86/dl-cacheinfo.c
> > 
> > diff --git a/elf/dl-tunables.c b/elf/dl-tunables.c
> > index 26e6e26612..7c9f1ca31f 100644
> > --- a/elf/dl-tunables.c
> > +++ b/elf/dl-tunables.c
> > @@ -100,31 +100,39 @@ get_next_env (char **envp, char **name, size_t *namelen, char **val,
> >      }									      \
> >  })
> >  
> > +#define TUNABLE_UPDATE_VAL(__cur, __val, __min, __max, __type)		      \
> > +({									      \
> > +  (__cur)->type.min = (__min);						      \
> > +  (__cur)->type.max = (__max);						      \
> > +  (__cur)->val.numval = (__val);					      \
> > +  (__cur)->initialized = true;						      \
> > +})
> 
> Can we update TUNABLE_SET_VAL_IF_VALID_RANGE to take the extra parameters?
> 
> If the value is not within [__min, __max] it should not update numval.

I removed TUNABLE_UPDATE_VAL.

> 
> > +
> >  static void
> > -do_tunable_update_val (tunable_t *cur, const void *valp)
> > +do_tunable_update_val (tunable_t *cur, const void *valp,
> > +		       const void *minp, const void *maxp)
> >  {
> > -  uint64_t val;
> > +  uint64_t val, min, max;
> >  
> >    if (cur->type.type_code != TUNABLE_TYPE_STRING)
> > -    val = *((int64_t *) valp);
> > +    {
> > +      val = *((int64_t *) valp);
> > +      if (minp)
> > +	min = *((int64_t *) minp);
> > +      if (maxp)
> > +	max = *((int64_t *) maxp);
> > +    }
> 
> OK.
> 
> >  
> >    switch (cur->type.type_code)
> >      {
> >      case TUNABLE_TYPE_INT_32:
> > -	{
> > -	  TUNABLE_SET_VAL_IF_VALID_RANGE (cur, val, int64_t);
> > -	  break;
> > -	}
> >      case TUNABLE_TYPE_UINT_64:
> > -	{
> > -	  TUNABLE_SET_VAL_IF_VALID_RANGE (cur, val, uint64_t);
> > -	  break;
> > -	}
> >      case TUNABLE_TYPE_SIZE_T:
> > -	{
> > -	  TUNABLE_SET_VAL_IF_VALID_RANGE (cur, val, uint64_t);
> > -	  break;
> > -	}
> > +      if (minp && maxp)
> > +	TUNABLE_UPDATE_VAL (cur, val, min, max, int64_t);
> > +      else
> > +	TUNABLE_SET_VAL_IF_VALID_RANGE (cur, val, int64_t);
> > +      break;
> 
> Merging the two would result in a one call here and only one macro API
> for set/update. I don't see the requirement for a different set and update.

I left this unchanged.

> 
> >      case TUNABLE_TYPE_STRING:
> >  	{
> >  	  cur->val.strval = valp;
> > @@ -153,7 +161,7 @@ tunable_initialize (tunable_t *cur, const char *strval)
> >        cur->initialized = true;
> >        valp = strval;
> >      }
> > -  do_tunable_update_val (cur, valp);
> > +  do_tunable_update_val (cur, valp, NULL, NULL);
> >  }
> >  
> >  void
> > @@ -161,8 +169,17 @@ __tunable_set_val (tunable_id_t id, void *valp)
> >  {
> >    tunable_t *cur = &tunable_list[id];
> >  
> > -  do_tunable_update_val (cur, valp);
> > +  do_tunable_update_val (cur, valp, NULL, NULL);
> > +}
> > +
> > +void
> > +__tunable_update_val (tunable_id_t id, void *valp, void *minp, void *maxp)
> > +{
> > +  tunable_t *cur = &tunable_list[id];
> > +
> > +  do_tunable_update_val (cur, valp, minp, maxp);
> >  }
> > +rtld_hidden_def (__tunable_update_val)
> >  
> >  #if TUNABLES_FRONTEND == TUNABLES_FRONTEND_valstring
> >  /* Parse the tunable string TUNESTR and adjust it to drop any tunables that may
> > diff --git a/elf/dl-tunables.h b/elf/dl-tunables.h
> > index f05eb50c2f..f6bf7379af 100644
> > --- a/elf/dl-tunables.h
> > +++ b/elf/dl-tunables.h
> > @@ -71,8 +71,10 @@ typedef struct _tunable tunable_t;
> >  extern void __tunables_init (char **);
> >  extern void __tunable_get_val (tunable_id_t, void *, tunable_callback_t);
> >  extern void __tunable_set_val (tunable_id_t, void *);
> > +extern void __tunable_update_val (tunable_id_t, void *, void *, void *);
> >  rtld_hidden_proto (__tunables_init)
> >  rtld_hidden_proto (__tunable_get_val)
> > +rtld_hidden_proto (__tunable_update_val)
> >  
> >  /* Define TUNABLE_GET and TUNABLE_SET in short form if TOP_NAMESPACE and
> >     TUNABLE_NAMESPACE are defined.  This is useful shorthand to get and set
> > @@ -82,11 +84,16 @@ rtld_hidden_proto (__tunable_get_val)
> >    TUNABLE_GET_FULL (TOP_NAMESPACE, TUNABLE_NAMESPACE, __id, __type, __cb)
> >  # define TUNABLE_SET(__id, __type, __val) \
> >    TUNABLE_SET_FULL (TOP_NAMESPACE, TUNABLE_NAMESPACE, __id, __type, __val)
> > +# define TUNABLE_UPDATE(__id, __type, __val, __min, __max) \
> > +  TUNABLE_UPDATE_FULL (TOP_NAMESPACE, TUNABLE_NAMESPACE, __id, __type, \
> > +		       __val, __min, __max)
> 
> Please use TUNABLE_SET?
> 
> I would like to avoid needing new macro APIs.
> 
> There doesn't need to be symmetry between TUNABLE_GET and TUNABLE_SET.
> 
> The TUNABLE_GET is for getting the value of the tunable during subsystem
> startup, and the tunable framework handles: setting the default value,
> processing user settings, enforcing minimums, enforcing maximums etc.
> 
> The TUNABLE_SET side doesn't have to be symmetric; it may need to set more
> than just the tunable value, e.g. min/max.

TUNABLE_SET is still needed to set only the value.  I added TUNABLE_SET_ALL
to set the value as well as min/max.

> 
> > -}
> > -
> > -
> 
> OK.
> 
> >  /* Data cache size for use in memory and string routines, typically
> OK.
> 
> > +
> >  #if HAVE_TUNABLES
> >    TUNABLE_GET (hwcaps, tunable_val_t *, TUNABLE_CALLBACK (set_hwcaps));
> > -  cpu_features->non_temporal_threshold
> > +  long int tunable_size;
> > +  tunable_size = TUNABLE_GET (x86_data_cache_size, long int, NULL);
> > +  if (tunable_size != 0)
> > +    data = tunable_size;
> > +  tunable_size = TUNABLE_GET (x86_shared_cache_size, long int, NULL);
> > +  if (tunable_size != 0)
> > +    shared = tunable_size;
> > +  tunable_size = TUNABLE_GET (x86_non_temporal_threshold, long int, NULL);
> > +  if (tunable_size != 0)
> > +    non_temporal_threshold = tunable_size;
> 
> This is wrong, you have excluded 0 from the list of allowed options?

0 is invalid and means it is unset in tunables.

> Why not raise the dl-tunables.list minimum to 1?
> Then the above code just becomes what we used to have.

What we used to have is

  cpu_features->non_temporal_threshold
    = TUNABLE_GET (x86_non_temporal_threshold, long int, NULL);
...
  __x86_shared_non_temporal_threshold
    = (cpu_features->non_temporal_threshold != 0
       ? cpu_features->non_temporal_threshold
       : __x86_shared_cache_size * threads * 3 / 4);

I just changed the order.

> 
> e.g.
>   cpu_features->non_temporal_threshold
>     = TUNABLE_GET (x86_non_temporal_threshold, long int, NULL);
> 
> The tunables framework should make it so you don't have to write this
> boilerplate.
> 
> There should be only *one* variable that you have to handle specially
> for the dynamic minimum with a TUNABLE_GET + TUNABLE_SET.
> 
> > +#endif
> > +
> > +  cpu_features->data_cache_size = data;
> > +  cpu_features->shared_cache_size = shared;
> > +  cpu_features->non_temporal_threshold = non_temporal_threshold;
> 
> Not needed, you can just fold the cpu_features->foo update like we used
> to have it. The ranges are not being updated to any dynamic values.

The purpose of these changes is to make these values always valid
so that they can be used directly.  Otherwise, they have to be checked
against invalid 0 value before using.

> > +
> > +#if HAVE_TUNABLES
> > +  TUNABLE_UPDATE (x86_data_cache_size, long int,
> > +		  data, 0, (long int) -1);
> > +  TUNABLE_UPDATE (x86_shared_cache_size, long int,
> > +		  shared, 0, (long int) -1);
> > +  TUNABLE_UPDATE (x86_non_temporal_threshold, long int,
> > +		  non_temporal_threshold, 0, (long int) -1);
> 
> Delete all of these. They don't need updating?

Done.

> > +#endif
> > +}
> > diff --git a/sysdeps/x86/init-arch.h b/sysdeps/x86/init-arch.h
> > index d6f59cf962..272ed10902 100644
> > --- a/sysdeps/x86/init-arch.h
> > +++ b/sysdeps/x86/init-arch.h
> > @@ -23,6 +23,9 @@
> >  #include <ifunc-init.h>
> >  #include <isa.h>
> >  
> > +extern void __init_cacheinfo (void)
> > +  __attribute__ ((visibility ("hidden")));
> > +
> >  #ifndef __x86_64__
> >  /* Due to the reordering and the other nifty extensions in i686, it is
> >     not really good to use heavily i586 optimized code on an i686.  It's
> > 

H.J.
---
From b66f08560b08ad1d718b3d19a8b0bee66c08ba49 Mon Sep 17 00:00:00 2001
From: "H.J. Lu" <hjl.tools@gmail.com>
Date: Mon, 1 Jun 2020 14:11:32 -0700
Subject: [PATCH 1/2] Set tunable value as well as min/max values

Update __tunable_set_val to set tunable value as well as min/max values.
TUNABLE_SET_ALL macro is added, but not used.  Move x86 processor cache
info to cpu_features.
---
 elf/dl-tunables.c          |  20 +-
 elf/dl-tunables.h          |  18 +-
 sysdeps/i386/cacheinfo.c   |   3 -
 sysdeps/x86/Makefile       |   2 +-
 sysdeps/x86/cacheinfo.c    | 852 +++--------------------------------
 sysdeps/x86/cpu-features.c |  19 +-
 sysdeps/x86/cpu-features.h |  26 ++
 sysdeps/x86/dl-cacheinfo.c | 879 +++++++++++++++++++++++++++++++++++++
 sysdeps/x86/init-arch.h    |   3 +
 9 files changed, 996 insertions(+), 826 deletions(-)
 delete mode 100644 sysdeps/i386/cacheinfo.c
 create mode 100644 sysdeps/x86/dl-cacheinfo.c

Message ID	20200703230951.GA1301408@gmail.com
State	Superseded
Headers	Return-Path: <libc-alpha-bounces@sourceware.org> X-Original-To: patchwork@sourceware.org Delivered-To: patchwork@sourceware.org Received: from server2.sourceware.org (localhost [IPv6:::1]) by sourceware.org (Postfix) with ESMTP id 1F51A3851C09; Fri, 3 Jul 2020 23:10:02 +0000 (GMT) DKIM-Filter: OpenDKIM Filter v2.11.0 sourceware.org 1F51A3851C09 DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/relaxed; d=sourceware.org; s=default; t=1593817802; bh=QurbJDFeSqcEJ+WIIDJBl21uAd2cX0H3pTJOVeWYyAI=; h=Date:To:Subject:References:In-Reply-To:List-Id:List-Unsubscribe: List-Archive:List-Post:List-Help:List-Subscribe:From:Reply-To:Cc: From; b=JzHdC7M/MixZDfrfUr/dUCeaVagp+CwIYWphZxirul3lg1NWAGQI6s0d39NMTKvzA ExpwGaeblbBTD0SlpHZndxhFeWtJMukTbnHHB5fWH+KwhJB4tygUxB3Gwepi5Fu05q uzF/jzXEBZ6ZBXV/yvpFnLBUov5QrHO41WHYNuk0= X-Original-To: libc-alpha@sourceware.org Delivered-To: libc-alpha@sourceware.org Received: from mail-pg1-x530.google.com (mail-pg1-x530.google.com [IPv6:2607:f8b0:4864:20::530]) by sourceware.org (Postfix) with ESMTPS id 4E08B3851C09 for <libc-alpha@sourceware.org>; Fri, 3 Jul 2020 23:09:54 +0000 (GMT) DMARC-Filter: OpenDMARC Filter v1.3.2 sourceware.org 4E08B3851C09 Received: by mail-pg1-x530.google.com with SMTP id e18so15689743pgn.7 for <libc-alpha@sourceware.org>; Fri, 03 Jul 2020 16:09:54 -0700 (PDT) X-Google-DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/relaxed; d=1e100.net; s=20161025; h=x-gm-message-state:date:from:to:cc:subject:message-id:references :mime-version:content-disposition:in-reply-to; bh=QurbJDFeSqcEJ+WIIDJBl21uAd2cX0H3pTJOVeWYyAI=; b=OYnOq/wvYM917ra09aquqtOz5Gl+98qkqmjrCfQwku4KYwPI+NTyuMqPUAriXCfT6d aTEL9wxgfFd6P5+2UcEVTiWwQYEdu3q9ydWEj0CbRPPEoO9SI02ms7rH8Lz/77z+F06p tVpxYEsIzdonpCZq78uoPsLhZeBVQ2FnFSyEengV3CmDLVXMDWzoxI7S480qUaxBhvxJ coSF87nVcu0JjXYEwsHXUE3k3u3sHhThhHc9S2NBP1HobKUrhSkmbcozpD7X7X9oANmo iFuYKWN4SOEKDz1837VKOPwUn9nxqOr8d6Ahm/jUh0PJkMiYP7Wh2svTvxbHdkMU16fI EjFw== X-Gm-Message-State: 
AOAM533INu3uS8182e/BrVj1M7j2wygLhf+XYMP3d5YW8DohC0MMMlvS vdAEJLpz68VfVc8ZPe7uCqo= X-Google-Smtp-Source: ABdhPJwsKNQPrsFy2Ean11BLqXLShZwyj9fGo9+lbYSDXRvuo+4tg/QBxuXk9pZmlfDehkbEK66FFQ== X-Received: by 2002:a63:fc59:: with SMTP id r25mr7921857pgk.336.1593817792899; Fri, 03 Jul 2020 16:09:52 -0700 (PDT) Received: from gnu-cfl-2.localdomain (c-69-181-90-243.hsd1.ca.comcast.net. [69.181.90.243]) by smtp.gmail.com with ESMTPSA id r8sm11607792pfh.29.2020.07.03.16.09.52 (version=TLS1_3 cipher=TLS_AES_256_GCM_SHA384 bits=256/256); Fri, 03 Jul 2020 16:09:52 -0700 (PDT) Received: by gnu-cfl-2.localdomain (Postfix, from userid 1000) id 5B8341A0509; Fri, 3 Jul 2020 16:09:51 -0700 (PDT) Date: Fri, 3 Jul 2020 16:09:51 -0700 To: Carlos O'Donell <carlos@redhat.com> Subject: V2 [PATCH 1/2] Update tunable min/max values Message-ID: <20200703230951.GA1301408@gmail.com> References: <20200703175220.1178840-1-hjl.tools@gmail.com> <20200703175220.1178840-2-hjl.tools@gmail.com> <cc15fba0-0fc1-d0fa-3895-fda3bafb8f1b@redhat.com> MIME-Version: 1.0 Content-Type: text/plain; charset=us-ascii Content-Disposition: inline In-Reply-To: <cc15fba0-0fc1-d0fa-3895-fda3bafb8f1b@redhat.com> X-Spam-Status: No, score=-13.0 required=5.0 tests=BAYES_00, DKIM_SIGNED, DKIM_VALID, DKIM_VALID_AU, DKIM_VALID_EF, FREEMAIL_FROM, GIT_PATCH_0, KAM_SHORT, RCVD_IN_DNSWL_NONE, SPF_HELO_NONE, SPF_PASS, TXREP autolearn=ham autolearn_force=no version=3.4.2 X-Spam-Checker-Version: SpamAssassin 3.4.2 (2018-09-13) on server2.sourceware.org X-BeenThere: libc-alpha@sourceware.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: Libc-alpha mailing list <libc-alpha.sourceware.org> List-Unsubscribe: <http://sourceware.org/mailman/options/libc-alpha>, <mailto:libc-alpha-request@sourceware.org?subject=unsubscribe> List-Archive: <https://sourceware.org/pipermail/libc-alpha/> List-Post: <mailto:libc-alpha@sourceware.org> List-Help: <mailto:libc-alpha-request@sourceware.org?subject=help> List-Subscribe: 
<http://sourceware.org/mailman/listinfo/libc-alpha>, <mailto:libc-alpha-request@sourceware.org?subject=subscribe> From: "H.J. Lu via Libc-alpha" <libc-alpha@sourceware.org> Reply-To: "H.J. Lu" <hjl.tools@gmail.com> Cc: libc-alpha@sourceware.org Errors-To: libc-alpha-bounces@sourceware.org Sender: "Libc-alpha" <libc-alpha-bounces@sourceware.org>
Series	V2 [PATCH 1/2] Update tunable min/max values \| V2 [PATCH 1/2] Update tunable min/max values

V2 [PATCH 1/2] Update tunable min/max values

Commit Message

Comments

Patch