/* Initialize cpu feature data.  s390x version.
   Copyright (C) 2023-2025 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.
   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.
   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   .  */
#include 
#include 
#include 
#include 
#include 
#include 
#include 
#include 
#define S390_COPY_CPU_FEATURES(SRC_PTR, DEST_PTR)	\
  (DEST_PTR)->hwcap = (SRC_PTR)->hwcap;			\
  (DEST_PTR)->stfle_filtered = (SRC_PTR)->stfle_filtered;
static void
TUNABLE_CALLBACK (set_hwcaps) (tunable_val_t *valp)
{
  /* The current IFUNC selection is always using the most recent
     features which are available via AT_HWCAP or STFLE-bits.  But in
     some scenarios it is useful to adjust this selection.
     The environment variable:
     GLIBC_TUNABLES=glibc.cpu.hwcaps=-xxx,yyy,zzz,....
     can be used to enable HWCAP/STFLE feature yyy, disable HWCAP/STFLE feature
     xxx, where the feature name is case-sensitive and has to match the ones
     used below.  Furthermore, the ARCH-level zzz can be used to set various
     HWCAP/STFLE features at once.  */
  /* Copy the features from dl_s390_cpu_features, which contains the features
     provided by AT_HWCAP and stfle-instruction.  */
  struct cpu_features *cpu_features = &GLRO(dl_s390_cpu_features);
  struct cpu_features cpu_features_orig;
  S390_COPY_CPU_FEATURES (cpu_features, &cpu_features_orig);
  struct cpu_features cpu_features_curr;
  S390_COPY_CPU_FEATURES (cpu_features, &cpu_features_curr);
  struct tunable_str_comma_state_t ts;
  tunable_str_comma_init (&ts, valp);
  struct tunable_str_comma_t t;
  while (tunable_str_comma_next (&ts, &t))
    {
      if (t.len == 0)
	continue;
      /* Handle only the features here which are really used in the
	 IFUNC-resolvers.  All others are ignored as the values are only used
	 inside glibc.  */
      bool reset_features = false;
      unsigned long int hwcap_mask = 0UL;
      unsigned long long stfle_bits0_mask = 0ULL;
      bool disable = t.disable;
      if (tunable_str_comma_strcmp_cte (&t, "zEC12")
	  || tunable_str_comma_strcmp_cte (&t, "arch10"))
	{
	  reset_features = true;
	  disable = true;
	  hwcap_mask = HWCAP_S390_VXRS | HWCAP_S390_VXRS_EXT
	    | HWCAP_S390_VXRS_EXT2;
	  stfle_bits0_mask = S390_STFLE_BIT61_ARCH13_MIE3;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "z13")
	       || tunable_str_comma_strcmp_cte (&t, "arch11"))
	{
	  reset_features = true;
	  disable = true;
	  hwcap_mask = HWCAP_S390_VXRS_EXT | HWCAP_S390_VXRS_EXT2;
	  stfle_bits0_mask = S390_STFLE_BIT61_ARCH13_MIE3;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "z14")
	       || tunable_str_comma_strcmp_cte (&t, "arch12"))
	{
	  reset_features = true;
	  disable = true;
	  hwcap_mask = HWCAP_S390_VXRS_EXT2;
	  stfle_bits0_mask = S390_STFLE_BIT61_ARCH13_MIE3;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "z15")
	       || tunable_str_comma_strcmp_cte (&t, "z16")
	       || tunable_str_comma_strcmp_cte (&t, "z17")
	       || tunable_str_comma_strcmp_cte (&t, "arch13")
	       || tunable_str_comma_strcmp_cte (&t, "arch14")
	       || tunable_str_comma_strcmp_cte (&t, "arch15"))
	{
	  /* For z15 or newer we don't have to disable something, but we have
	     to reset to the original values.  */
	  reset_features = true;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "HWCAP_S390_VXRS"))
	{
	  hwcap_mask = HWCAP_S390_VXRS;
	  if (t.disable)
	    hwcap_mask |= HWCAP_S390_VXRS_EXT | HWCAP_S390_VXRS_EXT2;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "HWCAP_S390_VXRS_EXT"))
	{
	  hwcap_mask = HWCAP_S390_VXRS_EXT;
	  if (t.disable)
	    hwcap_mask |= HWCAP_S390_VXRS_EXT2;
	  else
	    hwcap_mask |= HWCAP_S390_VXRS;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "HWCAP_S390_VXRS_EXT2"))
	{
	  hwcap_mask = HWCAP_S390_VXRS_EXT2;
	  if (!t.disable)
	    hwcap_mask |= HWCAP_S390_VXRS | HWCAP_S390_VXRS_EXT;
	}
      else if (tunable_str_comma_strcmp_cte (&t, "STFLE_MIE3"))
	stfle_bits0_mask = S390_STFLE_BIT61_ARCH13_MIE3;
      /* Perform the actions determined above.  */
      if (reset_features)
	{
	  S390_COPY_CPU_FEATURES (&cpu_features_orig, &cpu_features_curr);
	}
      if (hwcap_mask != 0UL)
	{
	  if (disable)
	    cpu_features_curr.hwcap &= ~hwcap_mask;
	  else
	    cpu_features_curr.hwcap |= hwcap_mask;
	}
      if (stfle_bits0_mask != 0ULL)
	{
	  if (disable)
	    cpu_features_curr.stfle_filtered &= ~stfle_bits0_mask;
	  else
	    cpu_features_curr.stfle_filtered |= stfle_bits0_mask;
	}
    }
  /* Copy back the features after checking that no unsupported features were
     enabled by user.  */
  cpu_features->hwcap = cpu_features_curr.hwcap & cpu_features_orig.hwcap;
  cpu_features->stfle_filtered = cpu_features_curr.stfle_filtered
    & cpu_features_orig.stfle_filtered;
}
static inline void
init_cpu_features_no_tunables (struct cpu_features *cpu_features)
{
  /* Only initialize once.  */
  if (cpu_features->hwcap != 0)
    return;
  /* Fill cpu_features as passed by kernel and machine.  */
  cpu_features->hwcap = GLRO(dl_hwcap);
  /* We want just 1 double word to be returned.  */
  if (__glibc_likely ((cpu_features->hwcap & HWCAP_S390_STFLE)
		      && (cpu_features->hwcap & HWCAP_S390_ZARCH)
		      && (cpu_features->hwcap & HWCAP_S390_HIGH_GPRS)))
    {
      unsigned long long stfle_bits[4] = { 0 };
      register unsigned long reg0 __asm__("0") = 3;
      __asm__ __volatile__(".machine push"        "\n\t"
			   ".machine \"z9-109\""  "\n\t"
			   ".machinemode \"zarch_nohighgprs\"\n\t"
			   "stfle %0"             "\n\t"
			   ".machine pop"         "\n"
			   : "=QS" (stfle_bits[0]),
			     "+d" (reg0)
			   : : "cc");
      unsigned long long internal_stfle_bits = 0;
      /* Facility bit 34: z10: General instructions extension.  */
      if ((stfle_bits[0] & (1ULL << (63 - 34))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT34_Z10;
      /* Facility bit 45: z196: Distinct operands, popcount, ...  */
      if ((stfle_bits[0] & (1ULL << (63 - 45))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT45_Z196;
      /* Facility bit 61: arch13/z15: Miscellaneous-Instruction-Extensions
	 Facility 3, e.g. mvcrl.  */
      if ((stfle_bits[0] & (1ULL << (63 - 61))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT61_ARCH13_MIE3;
      /* Facility bit 84: arch15/z17: Miscellaneous-instruction-extensions 4  */
      if ((stfle_bits[1] & (1ULL << (127 - 84))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT84_ARCH15_MIE4;
      /* Facility bit 198: arch15/z17: Vector-enhancements-facility 3  */
      if ((stfle_bits[3] & (1ULL << (255 - 198))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT198_ARCH15_VXRS_EXT3;
      /* Facility bit 199: arch15/z17: Vector-Packed-Decimal-Enhancement 3  */
      if ((stfle_bits[3] & (1ULL << (255 - 199))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT199_ARCH15_VXRS_PDE3;
      /* Facility bit 201: arch15/z17: CPU: Concurrent-Functions Facility  */
      if ((stfle_bits[3] & (1ULL << (255 - 201))) != 0)
	internal_stfle_bits |= S390_STFLE_BIT201_ARCH15_CON;
      cpu_features->stfle_orig = internal_stfle_bits;
      cpu_features->stfle_filtered = internal_stfle_bits;
    }
}
static inline void
init_cpu_features (struct cpu_features *cpu_features)
{
  init_cpu_features_no_tunables (cpu_features);
  TUNABLE_GET (glibc, cpu, hwcaps, tunable_val_t *, TUNABLE_CALLBACK (set_hwcaps));
}