/* libgcc/config/gcn/lib2-vec_divmod-hi.c - gcc - Git at Google  */

 /* Copyright (C) 2012-2023 Free Software Foundation, Inc.
    Contributed by Altera and Mentor Graphics, Inc.

 This file is free software; you can redistribute it and/or modify it
 under the terms of the GNU General Public License as published by the
 Free Software Foundation; either version 3, or (at your option) any
 later version.

 This file is distributed in the hope that it will be useful, but
 WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 General Public License for more details.

 Under Section 7 of GPL version 3, you are granted additional
 permissions described in the GCC Runtime Library Exception, version
 3.1, as published by the Free Software Foundation.

 You should have received a copy of the GNU General Public License and
 a copy of the GCC Runtime Library Exception along with this program;
 see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
 <http://www.gnu.org/licenses/>.  */

 #include "lib2-gcn.h"

 /* 16-bit V64HI divide and modulo as used in gcn.
    This is a simple conversion from lib2-divmod.c.  */

 #define MASKMODE v64hi
 #include "amdgcn_veclib.h"

 /* Unsigned 16-bit per-lane divide and modulo by shift-and-subtract.

    NUM is the dividend and DEN the divisor.  The quotient and the
    remainder are returned together as PACK_SI_PAIR (quotient, remainder).
    __mask is not named directly in this body; presumably the VECTOR_*
    macros and NO_COND from amdgcn_veclib.h consume it to restrict work to
    the active lanes -- confirm against that header.  */
 static v64udi
 __udivmodv64hi4_aux (v64uhi num, v64uhi den, v64hi __mask)
 {
   /* BIT tracks the quotient bit currently being tried; RES accumulates
      the quotient.  */
   v64uhi bit = VECTOR_INIT ((unsigned short)1U);
   v64uhi res = VECTOR_INIT ((unsigned short)0U);

   /* Normalise: shift DEN (and BIT with it) left while DEN is still below
      NUM, BIT has not been shifted out, and the top bit (bit 15) of DEN is
      clear so that a further shift cannot lose it.  */
   VECTOR_WHILE ((den < num) & (bit != 0) & ((den & (1L<<15)) == 0),
 		cond, NO_COND)
     VECTOR_COND_MOVE (den, den << 1, cond);
     VECTOR_COND_MOVE (bit, bit << 1, cond);
   VECTOR_ENDWHILE
   /* Walk BIT back down to zero.  Wherever DEN still fits into NUM,
      subtract it and record BIT in the quotient.  */
   VECTOR_WHILE (bit != 0, loopcond, NO_COND)
     VECTOR_IF2 (num >= den, ifcond, loopcond)
       VECTOR_COND_MOVE (num, num - den, ifcond);
       VECTOR_COND_MOVE (res, res | bit, ifcond);
     VECTOR_ENDIF
     VECTOR_COND_MOVE (bit, bit >> 1, loopcond);
     VECTOR_COND_MOVE (den, den >> 1, loopcond);
   VECTOR_ENDWHILE

   /* NUM now holds what is left of the dividend, i.e. the remainder.  */
   return PACK_SI_PAIR (res, num);
 }

 /* Signed 16-bit per-lane divide and modulo.

    Works on the magnitudes of A and B through __udivmodv64hi4_aux and then
    restores the signs: the quotient is negated where exactly one operand
    was negative, the remainder where the dividend A was negative.  The
    result is PACK_SI_PAIR (quotient, remainder).  */
 static v64udi
 __divmodv64hi4_aux (v64hi a, v64hi b,  v64hi __mask)
 {
   /* Per-lane records of which operands were negative; left at zero
      unless set below.  */
   v64hi nega = VECTOR_INIT ((short)0);
   v64hi negb = VECTOR_INIT ((short)0);

   /* COND is introduced by the VECTOR_IF macro (defined outside this
      file); it is saved so the sign can be put back afterwards.  */
   VECTOR_IF (a < 0, cond)
     VECTOR_COND_MOVE (a, -a, cond);
     nega = cond;
   VECTOR_ENDIF

   VECTOR_IF (b < 0, cond)
     VECTOR_COND_MOVE (b, -b, cond);
     negb = cond;
   VECTOR_ENDIF

   /* Both operands are now treated as magnitudes; divide them unsigned.  */
   v64uhi ua = __builtin_convertvector (a, v64uhi);
   v64uhi ub = __builtin_convertvector (b, v64uhi);
   v64udi pair = __udivmodv64hi4_aux (ua, ub, __mask);

   /* Split the packed result, fix up the signs, and pack it again.  */
   v64hi quot = UNPACK_SI_LOW (v64hi, pair);
   v64hi rem = UNPACK_SI_HIGH (v64hi, pair);
   VECTOR_COND_MOVE (quot, -quot, nega ^ negb);
   VECTOR_COND_MOVE (rem, -rem, nega);
   pair = PACK_SI_PAIR (quot, rem);

   return pair;
 }


 /* Signed 16-bit vector division.  Runs the combined signed
    divide/modulo helper and hands back only the quotient, which is the
    component extracted with UNPACK_SI_LOW.  */
 static inline v64hi
 __divv64hi3_aux (v64hi a, v64hi b, v64hi __mask)
 {
   v64udi quot_rem = __divmodv64hi4_aux (a, b, __mask);
   return UNPACK_SI_LOW (v64hi, quot_rem);
 }

 /* Signed 16-bit vector modulo.  Runs the combined signed divide/modulo
    helper and hands back only the remainder, which is the component
    extracted with UNPACK_SI_HIGH.  */
 static inline v64hi
 __modv64hi3_aux (v64hi a, v64hi b, v64hi __mask)
 {
   v64udi quot_rem = __divmodv64hi4_aux (a, b, __mask);
   return UNPACK_SI_HIGH (v64hi, quot_rem);
 }


 /* Unsigned 16-bit vector division.  Runs the combined unsigned
    divide/modulo helper and hands back only the quotient, which is the
    component extracted with UNPACK_SI_LOW.  */
 static inline v64uhi
 __udivv64hi3_aux (v64uhi a, v64uhi b, v64hi __mask)
 {
   v64udi quot_rem = __udivmodv64hi4_aux (a, b, __mask);
   return UNPACK_SI_LOW (v64uhi, quot_rem);
 }

 /* Unsigned 16-bit vector modulo.  Runs the combined unsigned
    divide/modulo helper and hands back only the remainder, which is the
    component extracted with UNPACK_SI_HIGH.  */
 static inline v64uhi
 __umodv64hi3_aux (v64uhi a, v64uhi b, v64hi __mask)
 {
   v64udi quot_rem = __udivmodv64hi4_aux (a, b, __mask);
   return UNPACK_SI_HIGH (v64uhi, quot_rem);
 }

 /* Instantiate the entry points for each operation.  DEF_VARIANTS and
    DEF_VARIANTS_B are not defined in this file (presumably they come from
    amdgcn_veclib.h and wrap the matching *_aux function above -- confirm
    there).  The arguments give the name prefix, the mode suffix and the
    element type; the _B form takes an extra udi argument, presumably the
    element type of the packed quotient/remainder result.  */
 DEF_VARIANTS (__div, hi3, hi)
 DEF_VARIANTS (__mod, hi3, hi)
 DEF_VARIANTS_B (__divmod, hi4, udi, hi)
 DEF_VARIANTS (__udiv, hi3, uhi)
 DEF_VARIANTS (__umod, hi3, uhi)
 DEF_VARIANTS_B (__udivmod, hi4, udi, uhi)
	/* Copyright (C) 2012-2023 Free Software Foundation, Inc.
	Contributed by Altera and Mentor Graphics, Inc.

	This file is free software; you can redistribute it and/or modify it
	under the terms of the GNU General Public License as published by the
	Free Software Foundation; either version 3, or (at your option) any
	later version.

	This file is distributed in the hope that it will be useful, but
	WITHOUT ANY WARRANTY; without even the implied warranty of
	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	General Public License for more details.

	Under Section 7 of GPL version 3, you are granted additional
	permissions described in the GCC Runtime Library Exception, version
	3.1, as published by the Free Software Foundation.

	You should have received a copy of the GNU General Public License and
	a copy of the GCC Runtime Library Exception along with this program;
	see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
	<http://www.gnu.org/licenses/>. */

	#include "lib2-gcn.h"

	/* 16-bit V64HI divide and modulo as used in gcn.
	This is a simple conversion from lib2-divmod.c. */

	#define MASKMODE v64hi
	#include "amdgcn_veclib.h"

	/* Unsigned 16-bit per-lane divide and modulo by shift-and-subtract.

	   NUM is the dividend and DEN the divisor.  The quotient and the
	   remainder are returned together as PACK_SI_PAIR (quotient, remainder).
	   __mask is not named directly in this body; presumably the VECTOR_*
	   macros and NO_COND from amdgcn_veclib.h consume it to restrict work
	   to the active lanes -- confirm against that header.  */
	static v64udi
	__udivmodv64hi4_aux (v64uhi num, v64uhi den, v64hi __mask)
	{
	  /* BIT tracks the quotient bit currently being tried; RES accumulates
	     the quotient.  */
	  v64uhi bit = VECTOR_INIT ((unsigned short)1U);
	  v64uhi res = VECTOR_INIT ((unsigned short)0U);

	  /* Normalise: shift DEN (and BIT with it) left while DEN is still
	     below NUM, BIT has not been shifted out, and the top bit (bit 15)
	     of DEN is clear so that a further shift cannot lose it.  */
	  VECTOR_WHILE ((den < num) & (bit != 0) & ((den & (1L<<15)) == 0),
			cond, NO_COND)
	    VECTOR_COND_MOVE (den, den << 1, cond);
	    VECTOR_COND_MOVE (bit, bit << 1, cond);
	  VECTOR_ENDWHILE
	  /* Walk BIT back down to zero.  Wherever DEN still fits into NUM,
	     subtract it and record BIT in the quotient.  */
	  VECTOR_WHILE (bit != 0, loopcond, NO_COND)
	    VECTOR_IF2 (num >= den, ifcond, loopcond)
	      VECTOR_COND_MOVE (num, num - den, ifcond);
	      /* Plain bitwise OR; a stray backslash before the operator is not
		 valid C.  */
	      VECTOR_COND_MOVE (res, res | bit, ifcond);
	    VECTOR_ENDIF
	    VECTOR_COND_MOVE (bit, bit >> 1, loopcond);
	    VECTOR_COND_MOVE (den, den >> 1, loopcond);
	  VECTOR_ENDWHILE

	  /* NUM now holds what is left of the dividend, i.e. the remainder.  */
	  return PACK_SI_PAIR (res, num);
	}

	/* Signed 16-bit per-lane divide and modulo.

	   Works on the magnitudes of A and B through __udivmodv64hi4_aux and
	   then restores the signs: the quotient is negated where exactly one
	   operand was negative, the remainder where the dividend A was
	   negative.  The result is PACK_SI_PAIR (quotient, remainder).  */
	static v64udi
	__divmodv64hi4_aux (v64hi a, v64hi b, v64hi __mask)
	{
	/* Per-lane records of which operands were negative; left at zero
	   unless set below.  */
	v64hi nega = VECTOR_INIT ((short)0);
	v64hi negb = VECTOR_INIT ((short)0);

	/* COND is introduced by the VECTOR_IF macro (defined outside this
	   file); it is saved so the sign can be put back afterwards.  */
	VECTOR_IF (a < 0, cond)
	VECTOR_COND_MOVE (a, -a, cond);
	nega = cond;
	VECTOR_ENDIF

	VECTOR_IF (b < 0, cond)
	VECTOR_COND_MOVE (b, -b, cond);
	negb = cond;
	VECTOR_ENDIF

	/* Both operands are now treated as magnitudes; divide them unsigned.  */
	v64uhi ua = __builtin_convertvector (a, v64uhi);
	v64uhi ub = __builtin_convertvector (b, v64uhi);
	v64udi pair = __udivmodv64hi4_aux (ua, ub, __mask);

	/* Split the packed result, fix up the signs, and pack it again.  */
	v64hi quot = UNPACK_SI_LOW (v64hi, pair);
	v64hi rem = UNPACK_SI_HIGH (v64hi, pair);
	VECTOR_COND_MOVE (quot, -quot, nega ^ negb);
	VECTOR_COND_MOVE (rem, -rem, nega);
	pair = PACK_SI_PAIR (quot, rem);

	return pair;
	}


	/* Signed 16-bit vector division.  Delegates to the combined signed
	   divide/modulo helper and returns the quotient, i.e. the component
	   extracted with UNPACK_SI_LOW.  */
	static inline v64hi
	__divv64hi3_aux (v64hi a, v64hi b, v64hi __mask)
	{
	  v64udi packed = __divmodv64hi4_aux (a, b, __mask);
	  return UNPACK_SI_LOW (v64hi, packed);
	}

	/* Signed 16-bit vector modulo.  Delegates to the combined signed
	   divide/modulo helper and returns the remainder, i.e. the component
	   extracted with UNPACK_SI_HIGH.  */
	static inline v64hi
	__modv64hi3_aux (v64hi a, v64hi b, v64hi __mask)
	{
	  v64udi packed = __divmodv64hi4_aux (a, b, __mask);
	  return UNPACK_SI_HIGH (v64hi, packed);
	}


	/* Unsigned 16-bit vector division.  Delegates to the combined unsigned
	   divide/modulo helper and returns the quotient, i.e. the component
	   extracted with UNPACK_SI_LOW.  */
	static inline v64uhi
	__udivv64hi3_aux (v64uhi a, v64uhi b, v64hi __mask)
	{
	  v64udi packed = __udivmodv64hi4_aux (a, b, __mask);
	  return UNPACK_SI_LOW (v64uhi, packed);
	}

	/* Unsigned 16-bit vector modulo.  Delegates to the combined unsigned
	   divide/modulo helper and returns the remainder, i.e. the component
	   extracted with UNPACK_SI_HIGH.  */
	static inline v64uhi
	__umodv64hi3_aux (v64uhi a, v64uhi b, v64hi __mask)
	{
	  v64udi packed = __udivmodv64hi4_aux (a, b, __mask);
	  return UNPACK_SI_HIGH (v64uhi, packed);
	}

	/* Instantiate the entry points for each operation.  DEF_VARIANTS and
	   DEF_VARIANTS_B are not defined in this file (presumably they come
	   from amdgcn_veclib.h and wrap the matching *_aux function above --
	   confirm there).  The arguments give the name prefix, the mode suffix
	   and the element type; the _B form takes an extra udi argument,
	   presumably the element type of the packed quotient/remainder
	   result.  */
	DEF_VARIANTS (__div, hi3, hi)
	DEF_VARIANTS (__mod, hi3, hi)
	DEF_VARIANTS_B (__divmod, hi4, udi, hi)
	DEF_VARIANTS (__udiv, hi3, uhi)
	DEF_VARIANTS (__umod, hi3, uhi)
	DEF_VARIANTS_B (__udivmod, hi4, udi, uhi)