mirror of
				https://sourceware.org/git/glibc.git
				synced 2025-11-03 20:53:13 +03:00 
			
		
		
		
	POWER ISA 3.0 introduces the xssqrtqp instruction, which expects operands to be in Vector Registers (Altivec/VMX), even though this instruction belongs to the Vector-Scalar Instruction Set. In GCC's Extended Assembly for POWER, the 'wq' register constraint is provided for use with IEEE 754 128-bit floating-point values. However, this constraint does not limit the register allocation to Vector Registers (Altivec/VMX) and could assign a Vector-Scalar Register (VSX) to the operands of the instruction. This patch changes the register constraint used in sqrtf128 from 'wq' to 'v', in order to request a Vector Register (Altivec/VMX) for use with the xssqrtqp instruction. Tested for powerpc64le and --with-cpu=power9. [BZ #21941] * sysdeps/powerpc/fpu/math_private.h (__ieee754_sqrtf128): Since xssqrtqp requires operands to be in Vector Registers (Altivec/VMX), replace the register constraint 'wq' with 'v'. * sysdeps/powerpc/powerpc64le/power9/fpu/e_sqrtf128.c (__ieee754_sqrtf128): Likewise.
		
			
				
	
	
		
			153 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			153 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* Private inline math functions for powerpc.
 | 
						|
   Copyright (C) 2006-2017 Free Software Foundation, Inc.
 | 
						|
   This file is part of the GNU C Library.
 | 
						|
 | 
						|
   The GNU C Library is free software; you can redistribute it and/or
 | 
						|
   modify it under the terms of the GNU Lesser General Public
 | 
						|
   License as published by the Free Software Foundation; either
 | 
						|
   version 2.1 of the License, or (at your option) any later version.
 | 
						|
 | 
						|
   The GNU C Library is distributed in the hope that it will be useful,
 | 
						|
   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | 
						|
   Lesser General Public License for more details.
 | 
						|
 | 
						|
   You should have received a copy of the GNU Lesser General Public
 | 
						|
   License along with the GNU C Library; if not, see
 | 
						|
   <http://www.gnu.org/licenses/>.  */
 | 
						|
 | 
						|
#ifndef _PPC_MATH_PRIVATE_H_
 | 
						|
#define _PPC_MATH_PRIVATE_H_
 | 
						|
 | 
						|
#include <sysdep.h>
 | 
						|
#include <ldsodefs.h>
 | 
						|
#include <dl-procinfo.h>
 | 
						|
#include <fenv_private.h>
 | 
						|
#include_next <math_private.h>
 | 
						|
 | 
						|
#if defined _ARCH_PWR9 && __HAVE_DISTINCT_FLOAT128
/* Inline square root of __X for _Float128, computed with a single
   xssqrtqp instruction.  Both operands use the 'v' constraint so that
   they are allocated to Vector Registers (Altivec/VMX), which is where
   xssqrtqp expects its operands.  */
extern __always_inline _Float128
__ieee754_sqrtf128 (_Float128 __x)
{
  _Float128 __root;

  asm ("xssqrtqp %0,%1"
       : "=v" (__root)
       : "v" (__x));

  return __root;
}
#endif
 | 
						|
 | 
						|
extern double __slow_ieee754_sqrt (double);
 | 
						|
extern __always_inline double
 | 
						|
__ieee754_sqrt (double __x)
 | 
						|
{
 | 
						|
  double __z;
 | 
						|
 | 
						|
#ifdef _ARCH_PPCSQ
 | 
						|
   asm ("fsqrt	%0,%1" : "=f" (__z) : "f" (__x));
 | 
						|
#else
 | 
						|
   __z = __slow_ieee754_sqrt(__x);
 | 
						|
#endif
 | 
						|
 | 
						|
  return __z;
 | 
						|
}
 | 
						|
 | 
						|
extern float __slow_ieee754_sqrtf (float);
 | 
						|
extern __always_inline float
 | 
						|
__ieee754_sqrtf (float __x)
 | 
						|
{
 | 
						|
  float __z;
 | 
						|
 | 
						|
#ifdef _ARCH_PPCSQ
 | 
						|
  asm ("fsqrts	%0,%1" : "=f" (__z) : "f" (__x));
 | 
						|
#else
 | 
						|
   __z = __slow_ieee754_sqrtf(__x);
 | 
						|
#endif
 | 
						|
 | 
						|
  return __z;
 | 
						|
}
 | 
						|
 | 
						|
#if defined _ARCH_PWR5X
 | 
						|
 | 
						|
/* Unless already provided, define __round (X) as a statement
   expression that applies the frin instruction (Floating Round to
   Integer Nearest) to X in a floating-point register and yields the
   result as a double.  */
# ifndef __round
#  define __round(x)					\
  ({							\
    double __rounded;					\
    __asm__ __volatile__ (				\
	"	frin %0,%1\n"				\
	: "=f" (__rounded)				\
	: "f" (x));					\
    __rounded;						\
  })
# endif
 | 
						|
/* Unless already provided, define __roundf (X) as a statement
   expression that applies frin (Floating Round to Integer Nearest) to
   X and then frsp (Floating Round to Single-Precision) to the result,
   yielding a float.  */
# ifndef __roundf
#  define __roundf(x)					\
  ({							\
    float __rounded;					\
    __asm__ __volatile__ (				\
	"	frin %0,%1\n"				\
	"	frsp %0,%0\n"				\
	: "=f" (__rounded)				\
	: "f" (x));					\
    __rounded;						\
  })
# endif
 | 
						|
 | 
						|
/* Unless already provided, define __trunc (X) as a statement
   expression that applies the friz instruction (Floating Round to
   Integer toward Zero) to X and yields the result as a double.  */
# ifndef __trunc
#  define __trunc(x)					\
  ({							\
    double __truncated;					\
    __asm__ __volatile__ (				\
	"	friz %0,%1\n"				\
	: "=f" (__truncated)				\
	: "f" (x));					\
    __truncated;					\
  })
# endif
 | 
						|
/* Unless already provided, define __truncf (X) as a statement
   expression that applies friz (Floating Round to Integer toward Zero)
   to X and then frsp (Floating Round to Single-Precision) to the
   result, yielding a float.  */
# ifndef __truncf
#  define __truncf(x)					\
  ({							\
    float __truncated;					\
    __asm__ __volatile__ (				\
	"	friz %0,%1\n"				\
	"	frsp %0,%0\n"				\
	: "=f" (__truncated)				\
	: "f" (x));					\
    __truncated;					\
  })
# endif
 | 
						|
 | 
						|
/* Unless already provided, define __ceil (X) as a statement expression
   that applies the frip instruction (Floating Round to Integer Plus,
   i.e. toward +infinity) to X and yields the result as a double.  */
# ifndef __ceil
#  define __ceil(x)					\
  ({							\
    double __raised;					\
    __asm__ __volatile__ (				\
	"	frip %0,%1\n"				\
	: "=f" (__raised)				\
	: "f" (x));					\
    __raised;						\
  })
# endif
 | 
						|
/* Unless already provided, define __ceilf (X) as a statement
   expression that applies frip (Floating Round to Integer Plus, i.e.
   toward +infinity) to X and then frsp (Floating Round to
   Single-Precision) to the result, yielding a float.  */
# ifndef __ceilf
#  define __ceilf(x)					\
  ({							\
    float __raised;					\
    __asm__ __volatile__ (				\
	"	frip %0,%1\n"				\
	"	frsp %0,%0\n"				\
	: "=f" (__raised)				\
	: "f" (x));					\
    __raised;						\
  })
# endif
 | 
						|
 | 
						|
/* Unless already provided, define __floor (X) as a statement
   expression that applies the frim instruction (Floating Round to
   Integer Minus, i.e. toward -infinity) to X and yields the result as
   a double.  */
# ifndef __floor
#  define __floor(x)					\
  ({							\
    double __lowered;					\
    __asm__ __volatile__ (				\
	"	frim %0,%1\n"				\
	: "=f" (__lowered)				\
	: "f" (x));					\
    __lowered;						\
  })
# endif
 | 
						|
/* Unless already provided, define __floorf (X) as a statement
   expression that applies frim (Floating Round to Integer Minus, i.e.
   toward -infinity) to X and then frsp (Floating Round to
   Single-Precision) to the result, yielding a float.  */
# ifndef __floorf
#  define __floorf(x)					\
  ({							\
    float __lowered;					\
    __asm__ __volatile__ (				\
	"	frim %0,%1\n"				\
	"	frsp %0,%0\n"				\
	: "=f" (__lowered)				\
	: "f" (x));					\
    __lowered;						\
  })
# endif
 | 
						|
 | 
						|
#endif	/* defined _ARCH_PWR5X */
 | 
						|
 | 
						|
#endif /* _PPC_MATH_PRIVATE_H_ */
 |