Blame - include/qemu/host-utils.h - people/peter.maydell/qemu-arm.git

blob: a3a7ced78da278bbad0a5a0a4bfbbfc95204b576 [file] [log] [blame]

ths	05f778c	2007-10-27 13:05:54 +0000	[diff] [blame]	1	/*
				2	* Utility compute operations used by translated code.
				3	*
				4	* Copyright (c) 2007 Thiemo Seufer
				5	* Copyright (c) 2007 Jocelyn Mayer
				6	*
				7	* Permission is hereby granted, free of charge, to any person obtaining a copy
				8	* of this software and associated documentation files (the "Software"), to deal
				9	* in the Software without restriction, including without limitation the rights
				10	* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
				11	* copies of the Software, and to permit persons to whom the Software is
				12	* furnished to do so, subject to the following conditions:
				13	*
				14	* The above copyright notice and this permission notice shall be included in
				15	* all copies or substantial portions of the Software.
				16	*
				17	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				18	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				19	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
				20	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				21	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				22	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
				23	* THE SOFTWARE.
				24	*/
Markus Armbruster	175de52	2016-06-29 15:29:06 +0200	[diff] [blame]	25
Luis Pires	8ac2d6c	2021-10-25 16:11:37 -0300	[diff] [blame]	26	/* Portions of this work are licensed under the terms of the GNU GPL,
				27	* version 2 or later. See the COPYING file in the top-level directory.
				28	*/
				29
Paolo Bonzini	cb9c377	2012-12-06 12:15:58 +0100	[diff] [blame]	30	#ifndef HOST_UTILS_H
Markus Armbruster	175de52	2016-06-29 15:29:06 +0200	[diff] [blame]	31	#define HOST_UTILS_H
ths	05f778c	2007-10-27 13:05:54 +0000	[diff] [blame]	32
Richard Henderson	1ec8070	2020-11-13 03:22:23 +0000	[diff] [blame]	33	#include "qemu/compiler.h"
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	34	#include "qemu/bswap.h"
ths	cebdff7	2008-06-05 22:55:54 +0000	[diff] [blame]	35
Richard Henderson	f540166	2013-02-16 12:46:59 -0800	[diff] [blame]	36	#ifdef CONFIG_INT128
/**
 * mulu64 - unsigned 64 x 64 -> 128-bit multiplication
 * @plow: Output for the low 64 bits of the product
 * @phigh: Output for the high 64 bits of the product
 * @a, @b: Input multipliers
 */
static inline void mulu64(uint64_t *plow, uint64_t *phigh,
                          uint64_t a, uint64_t b)
{
    __uint128_t r = (__uint128_t)a * b;

    *plow = r;          /* truncates to the low 64 bits */
    *phigh = r >> 64;
}
Richard Henderson	f540166	2013-02-16 12:46:59 -0800	[diff] [blame]	44
/**
 * muls64 - signed 64 x 64 -> 128-bit multiplication
 * @plow: Output for the low 64 bits of the product
 * @phigh: Output for the high 64 bits of the product (two's complement)
 * @a, @b: Input multipliers
 */
static inline void muls64(uint64_t *plow, uint64_t *phigh,
                          int64_t a, int64_t b)
{
    __int128_t r = (__int128_t)a * b;

    *plow = r;          /* truncates to the low 64 bits */
    *phigh = r >> 64;
}
Tom Musta	98d1eb2	2014-01-07 10:05:51 -0600	[diff] [blame]	52
/* compute with 96 bit intermediate result: (a*b)/c */
static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
{
    /* Widen before multiplying so the 96-bit product cannot overflow. */
    return (__int128_t)a * b / c;
}
				58
/**
 * divu128 - unsigned 128-bit by 64-bit division
 * @plow: in/out - low 64 bits of the dividend, replaced by the low
 *        64 bits of the quotient
 * @phigh: in/out - high 64 bits of the dividend, replaced by the high
 *         64 bits of the quotient
 * @divisor: The divisor
 *
 * Returns the remainder.
 */
static inline uint64_t divu128(uint64_t *plow, uint64_t *phigh,
                               uint64_t divisor)
{
    __uint128_t dividend = ((__uint128_t)*phigh << 64) | *plow;
    __uint128_t result = dividend / divisor;

    *plow = result;
    *phigh = result >> 64;
    return dividend % divisor;
}
Tom Musta	e44259b	2014-01-07 10:05:52 -0600	[diff] [blame]	69
/**
 * divs128 - signed 128-bit by 64-bit division
 * @plow: in/out - low 64 bits of the dividend, replaced by the low
 *        64 bits of the quotient
 * @phigh: in/out - high 64 bits of the dividend, replaced by the high
 *         64 bits of the quotient
 * @divisor: The divisor
 *
 * Returns the remainder.
 */
static inline int64_t divs128(uint64_t *plow, int64_t *phigh,
                              int64_t divisor)
{
    /*
     * Assemble the dividend in unsigned arithmetic: left-shifting a
     * negative signed value is undefined behavior.
     */
    __int128_t dividend =
        (__int128_t)(((__uint128_t)(uint64_t)*phigh << 64) | *plow);
    __int128_t result = dividend / divisor;

    *plow = result;
    *phigh = result >> 64;
    return dividend % divisor;
}
j_mayer	7a51ad8	2007-11-04 02:24:58 +0000	[diff] [blame]	80	#else
/*
 * Out-of-line versions of the 128-bit helpers, declared here when
 * CONFIG_INT128 is not defined.  Results are returned through
 * @plow/@phigh; the division helpers return the remainder in the
 * CONFIG_INT128 implementations of the same names.
 */
void muls64(uint64_t *plow, uint64_t *phigh, int64_t a, int64_t b);
void mulu64(uint64_t *plow, uint64_t *phigh, uint64_t a, uint64_t b);
uint64_t divu128(uint64_t *plow, uint64_t *phigh, uint64_t divisor);
int64_t divs128(uint64_t *plow, int64_t *phigh, int64_t divisor);
Peter Maydell	49caffe	2015-08-19 16:20:20 +0100	[diff] [blame]	85
				86	static inline uint64_t muldiv64(uint64_t a, uint32_t b, uint32_t c)
				87	{
				88	union {
				89	uint64_t ll;
				90	struct {
				91	#ifdef HOST_WORDS_BIGENDIAN
				92	uint32_t high, low;
				93	#else
				94	uint32_t low, high;
				95	#endif
				96	} l;
				97	} u, res;
				98	uint64_t rl, rh;
				99
				100	u.ll = a;
				101	rl = (uint64_t)u.l.low * (uint64_t)b;
				102	rh = (uint64_t)u.l.high * (uint64_t)b;
				103	rh += (rl >> 32);
				104	res.l.high = rh / c;
				105	res.l.low = (((rh % c) << 32) + (rl & 0xffffffff)) / c;
				106	return res.ll;
				107	}
j_mayer	7a51ad8	2007-11-04 02:24:58 +0000	[diff] [blame]	108	#endif
				109
/**
 * clz32 - count leading zeros in a 32-bit value.
 * @val: The value to search
 *
 * Returns 32 if the value is zero.  Note that the GCC builtin is
 * undefined if the value is zero.
 */
static inline int clz32(uint32_t val)
{
    return val ? __builtin_clz(val) : 32;
}
				121
/**
 * clo32 - count leading ones in a 32-bit value.
 * @val: The value to search
 *
 * Returns 32 if the value is -1.
 */
static inline int clo32(uint32_t val)
{
    /* Leading ones of @val are leading zeros of its complement. */
    return clz32(~val);
}
				132
/**
 * clz64 - count leading zeros in a 64-bit value.
 * @val: The value to search
 *
 * Returns 64 if the value is zero.  Note that the GCC builtin is
 * undefined if the value is zero.
 */
static inline int clz64(uint64_t val)
{
    return val ? __builtin_clzll(val) : 64;
}
				144
/**
 * clo64 - count leading ones in a 64-bit value.
 * @val: The value to search
 *
 * Returns 64 if the value is -1.
 */
static inline int clo64(uint64_t val)
{
    /* Leading ones of @val are leading zeros of its complement. */
    return clz64(~val);
}
j_mayer	b9ef45f	2007-10-28 12:52:38 +0000	[diff] [blame]	155
/**
 * ctz32 - count trailing zeros in a 32-bit value.
 * @val: The value to search
 *
 * Returns 32 if the value is zero.  Note that the GCC builtin is
 * undefined if the value is zero.
 */
static inline int ctz32(uint32_t val)
{
    return val ? __builtin_ctz(val) : 32;
}
				167
/**
 * cto32 - count trailing ones in a 32-bit value.
 * @val: The value to search
 *
 * Returns 32 if the value is -1.
 */
static inline int cto32(uint32_t val)
{
    /* Trailing ones of @val are trailing zeros of its complement. */
    return ctz32(~val);
}
				178
/**
 * ctz64 - count trailing zeros in a 64-bit value.
 * @val: The value to search
 *
 * Returns 64 if the value is zero.  Note that the GCC builtin is
 * undefined if the value is zero.
 */
static inline int ctz64(uint64_t val)
{
    return val ? __builtin_ctzll(val) : 64;
}
				190
/**
 * cto64 - count trailing ones in a 64-bit value.
 * @val: The value to search
 *
 * Returns 64 if the value is -1.
 */
static inline int cto64(uint64_t val)
{
    /* Trailing ones of @val are trailing zeros of its complement. */
    return ctz64(~val);
}
				201
/**
 * clrsb32 - count leading redundant sign bits in a 32-bit value.
 * @val: The value to search
 *
 * Returns the number of bits following the sign bit that are equal to it.
 * No special cases; output range is [0-31].
 */
static inline int clrsb32(uint32_t val)
{
#if __has_builtin(__builtin_clrsb) || !defined(__clang__)
    return __builtin_clrsb(val);
#else
    /*
     * XOR with the value shifted right by one marks every position
     * where a bit differs from its more significant neighbour.
     */
    return clz32(val ^ ((int32_t)val >> 1)) - 1;
#endif
}
				217
				218	/**
				219	* clrsb64 - count leading redundant sign bits in a 64-bit value.
				220	* @val: The value to search
				221	*
				222	* Returns the number of bits following the sign bit that are equal to it.
				223	* No special cases; output range is [0-63].
				224	*/
				225	static inline int clrsb64(uint64_t val)
				226	{
Thomas Huth	f773b42	2018-12-03 14:33:12 +0100	[diff] [blame]	227	#if __has_builtin(__builtin_clrsbll) \|\| !defined(__clang__)
Claudio Fontana	afd3fe4	2013-12-17 19:42:35 +0000	[diff] [blame]	228	return __builtin_clrsbll(val);
				229	#else
				230	return clz64(val ^ ((int64_t)val >> 1)) - 1;
				231	#endif
				232	}
				233
				234	/**
Richard Henderson	72d8115	2013-02-13 17:47:35 -0800	[diff] [blame]	235	* ctpop8 - count the population of one bits in an 8-bit value.
				236	* @val: The value to search
				237	*/
Blue Swirl	facd285	2009-08-16 08:03:26 +0000	[diff] [blame]	238	static inline int ctpop8(uint8_t val)
j_mayer	b9ef45f	2007-10-28 12:52:38 +0000	[diff] [blame]	239	{
Richard Henderson	72d8115	2013-02-13 17:47:35 -0800	[diff] [blame]	240	return __builtin_popcount(val);
j_mayer	b9ef45f	2007-10-28 12:52:38 +0000	[diff] [blame]	241	}
				242
/**
 * ctpop16 - count the population of one bits in a 16-bit value.
 * @val: The value to search
 */
static inline int ctpop16(uint16_t val)
{
    return __builtin_popcount(val);
}
				251
/**
 * ctpop32 - count the population of one bits in a 32-bit value.
 * @val: The value to search
 */
static inline int ctpop32(uint32_t val)
{
    return __builtin_popcount(val);
}
				260
/**
 * ctpop64 - count the population of one bits in a 64-bit value.
 * @val: The value to search
 */
static inline int ctpop64(uint64_t val)
{
    return __builtin_popcountll(val);
}
Paolo Bonzini	cb9c377	2012-12-06 12:15:58 +0100	[diff] [blame]	269
/**
 * revbit8 - reverse the bits in an 8-bit value.
 * @x: The value to modify.
 */
static inline uint8_t revbit8(uint8_t x)
{
#if __has_builtin(__builtin_bitreverse8)
    return __builtin_bitreverse8(x);
#else
    /* Assign the correct nibble position.  */
    x = ((x & 0xf0) >> 4)
      | ((x & 0x0f) << 4);
    /* Assign the correct bit position.  */
    x = ((x & 0x88) >> 3)
      | ((x & 0x44) >> 1)
      | ((x & 0x22) << 1)
      | ((x & 0x11) << 3);
    return x;
#endif
}
				290
				291	/**
				292	* revbit16 - reverse the bits in a 16-bit value.
				293	* @x: The value to modify.
				294	*/
				295	static inline uint16_t revbit16(uint16_t x)
				296	{
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	297	#if __has_builtin(__builtin_bitreverse16)
				298	return __builtin_bitreverse16(x);
				299	#else
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	300	/* Assign the correct byte position. */
				301	x = bswap16(x);
				302	/* Assign the correct nibble position. */
				303	x = ((x & 0xf0f0) >> 4)
				304	\| ((x & 0x0f0f) << 4);
				305	/* Assign the correct bit position. */
				306	x = ((x & 0x8888) >> 3)
				307	\| ((x & 0x4444) >> 1)
				308	\| ((x & 0x2222) << 1)
				309	\| ((x & 0x1111) << 3);
				310	return x;
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	311	#endif
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	312	}
				313
				314	/**
				315	* revbit32 - reverse the bits in a 32-bit value.
				316	* @x: The value to modify.
				317	*/
				318	static inline uint32_t revbit32(uint32_t x)
				319	{
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	320	#if __has_builtin(__builtin_bitreverse32)
				321	return __builtin_bitreverse32(x);
				322	#else
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	323	/* Assign the correct byte position. */
				324	x = bswap32(x);
				325	/* Assign the correct nibble position. */
				326	x = ((x & 0xf0f0f0f0u) >> 4)
				327	\| ((x & 0x0f0f0f0fu) << 4);
				328	/* Assign the correct bit position. */
				329	x = ((x & 0x88888888u) >> 3)
				330	\| ((x & 0x44444444u) >> 1)
				331	\| ((x & 0x22222222u) << 1)
				332	\| ((x & 0x11111111u) << 3);
				333	return x;
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	334	#endif
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	335	}
				336
				337	/**
				338	* revbit64 - reverse the bits in a 64-bit value.
				339	* @x: The value to modify.
				340	*/
				341	static inline uint64_t revbit64(uint64_t x)
				342	{
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	343	#if __has_builtin(__builtin_bitreverse64)
				344	return __builtin_bitreverse64(x);
				345	#else
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	346	/* Assign the correct byte position. */
				347	x = bswap64(x);
				348	/* Assign the correct nibble position. */
				349	x = ((x & 0xf0f0f0f0f0f0f0f0ull) >> 4)
				350	\| ((x & 0x0f0f0f0f0f0f0f0full) << 4);
				351	/* Assign the correct bit position. */
				352	x = ((x & 0x8888888888888888ull) >> 3)
				353	\| ((x & 0x4444444444444444ull) >> 1)
				354	\| ((x & 0x2222222222222222ull) << 1)
				355	\| ((x & 0x1111111111111111ull) << 3);
				356	return x;
Richard Henderson	5140d6b	2020-11-06 10:59:36 -0800	[diff] [blame]	357	#endif
Richard Henderson	652a4b7	2015-09-14 13:00:34 -0700	[diff] [blame]	358	}
				359
/**
 * uabs64 - absolute value of a 64-bit integer as an unsigned 64-bit value
 * @v: The signed input
 *
 * The negation is done in unsigned arithmetic so that INT64_MIN maps to
 * 2^63 without signed overflow.
 */
static inline uint64_t uabs64(int64_t v)
{
    return v < 0 ? -(uint64_t)v : (uint64_t)v;
}
				367
				368	/**
Richard Henderson	cec07c0	2020-11-06 17:42:36 -0800	[diff] [blame]	369	* sadd32_overflow - addition with overflow indication
				370	* @x, @y: addends
				371	* @ret: Output for sum
				372	*
				373	* Computes *@ret = @x + @y, and returns true if and only if that
				374	* value has been truncated.
				375	*/
				376	static inline bool sadd32_overflow(int32_t x, int32_t y, int32_t *ret)
				377	{
				378	#if __has_builtin(__builtin_add_overflow) \|\| __GNUC__ >= 5
				379	return __builtin_add_overflow(x, y, ret);
				380	#else
				381	*ret = x + y;
				382	return ((*ret ^ x) & ~(x ^ y)) < 0;
				383	#endif
				384	}
				385
				386	/**
				387	* sadd64_overflow - addition with overflow indication
				388	* @x, @y: addends
				389	* @ret: Output for sum
				390	*
				391	* Computes *@ret = @x + @y, and returns true if and only if that
				392	* value has been truncated.
				393	*/
				394	static inline bool sadd64_overflow(int64_t x, int64_t y, int64_t *ret)
				395	{
				396	#if __has_builtin(__builtin_add_overflow) \|\| __GNUC__ >= 5
				397	return __builtin_add_overflow(x, y, ret);
				398	#else
				399	*ret = x + y;
				400	return ((*ret ^ x) & ~(x ^ y)) < 0;
				401	#endif
				402	}
				403
				404	/**
				405	* uadd32_overflow - addition with overflow indication
				406	* @x, @y: addends
				407	* @ret: Output for sum
				408	*
				409	* Computes *@ret = @x + @y, and returns true if and only if that
				410	* value has been truncated.
				411	*/
				412	static inline bool uadd32_overflow(uint32_t x, uint32_t y, uint32_t *ret)
				413	{
				414	#if __has_builtin(__builtin_add_overflow) \|\| __GNUC__ >= 5
				415	return __builtin_add_overflow(x, y, ret);
				416	#else
				417	*ret = x + y;
				418	return *ret < x;
				419	#endif
				420	}
				421
				422	/**
				423	* uadd64_overflow - addition with overflow indication
				424	* @x, @y: addends
				425	* @ret: Output for sum
				426	*
				427	* Computes *@ret = @x + @y, and returns true if and only if that
				428	* value has been truncated.
				429	*/
				430	static inline bool uadd64_overflow(uint64_t x, uint64_t y, uint64_t *ret)
				431	{
				432	#if __has_builtin(__builtin_add_overflow) \|\| __GNUC__ >= 5
				433	return __builtin_add_overflow(x, y, ret);
				434	#else
				435	*ret = x + y;
				436	return *ret < x;
				437	#endif
				438	}
				439
				440	/**
				441	* ssub32_overflow - subtraction with overflow indication
				442	* @x: Minuend
				443	* @y: Subtrahend
				444	* @ret: Output for difference
				445	*
				446	* Computes *@ret = @x - @y, and returns true if and only if that
				447	* value has been truncated.
				448	*/
				449	static inline bool ssub32_overflow(int32_t x, int32_t y, int32_t *ret)
				450	{
				451	#if __has_builtin(__builtin_sub_overflow) \|\| __GNUC__ >= 5
				452	return __builtin_sub_overflow(x, y, ret);
				453	#else
				454	*ret = x - y;
				455	return ((*ret ^ x) & (x ^ y)) < 0;
				456	#endif
				457	}
				458
				459	/**
				460	* ssub64_overflow - subtraction with overflow indication
				461	* @x: Minuend
				462	* @y: Subtrahend
				463	* @ret: Output for sum
				464	*
				465	* Computes *@ret = @x - @y, and returns true if and only if that
				466	* value has been truncated.
				467	*/
				468	static inline bool ssub64_overflow(int64_t x, int64_t y, int64_t *ret)
				469	{
				470	#if __has_builtin(__builtin_sub_overflow) \|\| __GNUC__ >= 5
				471	return __builtin_sub_overflow(x, y, ret);
				472	#else
				473	*ret = x - y;
				474	return ((*ret ^ x) & (x ^ y)) < 0;
				475	#endif
				476	}
				477
				478	/**
				479	* usub32_overflow - subtraction with overflow indication
				480	* @x: Minuend
				481	* @y: Subtrahend
				482	* @ret: Output for sum
				483	*
				484	* Computes *@ret = @x - @y, and returns true if and only if that
				485	* value has been truncated.
				486	*/
				487	static inline bool usub32_overflow(uint32_t x, uint32_t y, uint32_t *ret)
				488	{
				489	#if __has_builtin(__builtin_sub_overflow) \|\| __GNUC__ >= 5
				490	return __builtin_sub_overflow(x, y, ret);
				491	#else
				492	*ret = x - y;
				493	return x < y;
				494	#endif
				495	}
				496
				497	/**
				498	* usub64_overflow - subtraction with overflow indication
				499	* @x: Minuend
				500	* @y: Subtrahend
				501	* @ret: Output for sum
				502	*
				503	* Computes *@ret = @x - @y, and returns true if and only if that
				504	* value has been truncated.
				505	*/
				506	static inline bool usub64_overflow(uint64_t x, uint64_t y, uint64_t *ret)
				507	{
				508	#if __has_builtin(__builtin_sub_overflow) \|\| __GNUC__ >= 5
				509	return __builtin_sub_overflow(x, y, ret);
				510	#else
				511	*ret = x - y;
				512	return x < y;
				513	#endif
				514	}
				515
				516	/**
				517	* smul32_overflow - multiplication with overflow indication
				518	* @x, @y: Input multipliers
				519	* @ret: Output for product
				520	*
				521	* Computes @ret = @x @y, and returns true if and only if that
				522	* value has been truncated.
				523	*/
				524	static inline bool smul32_overflow(int32_t x, int32_t y, int32_t *ret)
				525	{
				526	#if __has_builtin(__builtin_mul_overflow) \|\| __GNUC__ >= 5
				527	return __builtin_mul_overflow(x, y, ret);
				528	#else
				529	int64_t z = (int64_t)x * y;
				530	*ret = z;
				531	return *ret != z;
				532	#endif
				533	}
				534
				535	/**
				536	* smul64_overflow - multiplication with overflow indication
				537	* @x, @y: Input multipliers
				538	* @ret: Output for product
				539	*
				540	* Computes @ret = @x @y, and returns true if and only if that
				541	* value has been truncated.
				542	*/
				543	static inline bool smul64_overflow(int64_t x, int64_t y, int64_t *ret)
				544	{
				545	#if __has_builtin(__builtin_mul_overflow) \|\| __GNUC__ >= 5
				546	return __builtin_mul_overflow(x, y, ret);
				547	#else
				548	uint64_t hi, lo;
				549	muls64(&lo, &hi, x, y);
				550	*ret = lo;
				551	return hi != ((int64_t)lo >> 63);
				552	#endif
				553	}
				554
				555	/**
				556	* umul32_overflow - multiplication with overflow indication
				557	* @x, @y: Input multipliers
				558	* @ret: Output for product
				559	*
				560	* Computes @ret = @x @y, and returns true if and only if that
				561	* value has been truncated.
				562	*/
				563	static inline bool umul32_overflow(uint32_t x, uint32_t y, uint32_t *ret)
				564	{
				565	#if __has_builtin(__builtin_mul_overflow) \|\| __GNUC__ >= 5
				566	return __builtin_mul_overflow(x, y, ret);
				567	#else
				568	uint64_t z = (uint64_t)x * y;
				569	*ret = z;
				570	return z > UINT32_MAX;
				571	#endif
				572	}
				573
				574	/**
				575	* umul64_overflow - multiplication with overflow indication
				576	* @x, @y: Input multipliers
				577	* @ret: Output for product
				578	*
				579	* Computes @ret = @x @y, and returns true if and only if that
				580	* value has been truncated.
				581	*/
				582	static inline bool umul64_overflow(uint64_t x, uint64_t y, uint64_t *ret)
				583	{
				584	#if __has_builtin(__builtin_mul_overflow) \|\| __GNUC__ >= 5
				585	return __builtin_mul_overflow(x, y, ret);
				586	#else
				587	uint64_t hi;
				588	mulu64(ret, &hi, x, y);
				589	return hi != 0;
				590	#endif
				591	}
				592
/**
 * uadd64_carry - addition with carry-in and carry-out
 * @x, @y: addends
 * @pcarry: in-out carry value
 *
 * Computes @x + @y + *@pcarry, placing the carry-out back
 * into *@pcarry and returning the 64-bit sum.
 */
static inline uint64_t uadd64_carry(uint64_t x, uint64_t y, bool *pcarry)
{
#if __has_builtin(__builtin_addcll)
    unsigned long long c = *pcarry;
    x = __builtin_addcll(x, y, c, &c);
    *pcarry = c & 1;
    return x;
#else
    bool c = *pcarry;
    /* This is clang's internal expansion of __builtin_addc. */
    c = uadd64_overflow(x, c, &x);
    c |= uadd64_overflow(x, y, &x);
    *pcarry = c;
    return x;
#endif
}
				617
				618	/**
				619	* usub64_borrow - subtraction with borrow-in and borrow-out
				620	* @x, @y: addends
				621	* @pborrow: in-out borrow value
				622	*
				623	* Computes @x - @y - *@pborrow, placing the borrow-out back
				624	* into *@pborrow and returning the 64-bit sum.
				625	*/
				626	static inline uint64_t usub64_borrow(uint64_t x, uint64_t y, bool *pborrow)
				627	{
				628	#if __has_builtin(__builtin_subcll)
				629	unsigned long long b = *pborrow;
				630	x = __builtin_subcll(x, y, b, &b);
				631	*pborrow = b & 1;
				632	return x;
				633	#else
				634	bool b = *pborrow;
				635	b = usub64_overflow(x, b, &x);
				636	b \|= usub64_overflow(x, y, &x);
				637	*pborrow = b;
				638	return x;
				639	#endif
				640	}
				641
/*
 * Host type specific sizes of these routines: the "l" suffixed names
 * operate on a value the width of the host's unsigned long.
 */

#if ULONG_MAX == UINT32_MAX
# define clzl   clz32
# define ctzl   ctz32
# define clol   clo32
# define ctol   cto32
# define ctpopl ctpop32
# define revbitl revbit32
#elif ULONG_MAX == UINT64_MAX
# define clzl   clz64
# define ctzl   ctz64
# define clol   clo64
# define ctol   cto64
# define ctpopl ctpop64
# define revbitl revbit64
#else
# error Unknown sizeof long
#endif
				661
/**
 * is_power_of_2 - test whether a value has exactly one bit set
 * @value: The value to test
 *
 * Returns false for zero.
 */
static inline bool is_power_of_2(uint64_t value)
{
    if (!value) {
        return false;
    }

    /* Clearing the lowest set bit leaves zero iff only one bit was set. */
    return !(value & (value - 1));
}
				670
/**
 * Return @value rounded down to the nearest power of two or zero.
 */
static inline uint64_t pow2floor(uint64_t value)
{
    if (!value) {
        /* Avoid undefined shift by 64 */
        return 0;
    }
    /* Move the top bit down to the position of @value's highest set bit. */
    return 0x8000000000000000ull >> clz64(value);
}
				682
/*
 * Return @value rounded up to the nearest power of two modulo 2^64.
 * This is zero for @value > 2^63, so be careful.
 */
static inline uint64_t pow2ceil(uint64_t value)
{
    int n = clz64(value - 1);

    if (!n) {
        /*
         * @value - 1 has no leading zeroes, thus @value - 1 >= 2^63
         * Therefore, either @value == 0 or @value > 2^63.
         * If it's 0, return 1, else return 0.
         */
        return !value;
    }
    return 0x8000000000000000ull >> (n - 1);
}
				701
/**
 * pow2roundup32 - next power of two above a 32-bit value
 * @x: The input value
 *
 * Returns the smallest power of two strictly greater than @x, modulo
 * 2^32.  An input that is already a power of two is therefore doubled,
 * 0 yields 1, and any @x >= 2^31 yields 0.
 */
static inline uint32_t pow2roundup32(uint32_t x)
{
    /* Smear the highest set bit into every lower position. */
    x |= (x >> 1);
    x |= (x >> 2);
    x |= (x >> 4);
    x |= (x >> 8);
    x |= (x >> 16);
    return x + 1;
}
				711
/**
 * urshift - 128-bit Unsigned Right Shift.
 * @plow: in/out - lower 64-bit integer.
 * @phigh: in/out - higher 64-bit integer.
 * @shift: in - number of bit positions to shift, between 0 and 127.
 *
 * Result is zero-extended and stored in plow/phigh, which are
 * input/output variables. Shift values outside the range will
 * be mod to 128. In other words, the caller is responsible to
 * verify/assert both the shift range and plow/phigh pointers.
 */
void urshift(uint64_t *plow, uint64_t *phigh, int32_t shift);
				724
				725	/**
				726	* ulshift - 128-bit Unsigned Left Shift.
				727	* @plow: in/out - lower 64-bit integer.
				728	* @phigh: in/out - higher 64-bit integer.
				729	* @shift: in - bytes to shift, between 0 and 127.
				730	* @overflow: out - true if any 1-bit is shifted out.
				731	*
				732	* Result is zero-extended and stored in plow/phigh, which are
				733	* input/output variables. Shift values outside the range will
				734	* be mod to 128. In other words, the caller is responsible to
				735	* verify/assert both the shift range and plow/phigh pointers.
				736	*/
				737	void ulshift(uint64_t plow, uint64_t phigh, int32_t shift, bool *overflow);
				738
/*
 * From the GNU Multi Precision Library - longlong.h __udiv_qrnnd
 * (https://gmplib.org/repo/gmp/file/tip/longlong.h)
 *
 * Licensed under the GPLv2/LGPLv3
 *
 * udiv_qrnnd - divide the 128-bit value @n1:@n0 by the 64-bit @d
 * @r: Output for the remainder
 * @n1: High 64 bits of the dividend
 * @n0: Low 64 bits of the dividend
 * @d: The divisor
 *
 * Returns the 64-bit quotient.
 *
 * The generic path divides by the upper 32 bits of @d, so those must be
 * non-zero there.
 * NOTE(review): GMP documents this primitive as requiring @n1 < @d (so
 * the quotient fits in 64 bits) and, for the generic C version, a
 * divisor with its most significant bit set -- confirm callers ensure it.
 */
static inline uint64_t udiv_qrnnd(uint64_t *r, uint64_t n1,
                                  uint64_t n0, uint64_t d)
{
#if defined(__x86_64__)
    uint64_t q;
    /* divq divides rdx:rax by the operand: quotient in rax, remainder in rdx */
    __asm__("divq %4" : "=a"(q), "=d"(*r) : "0"(n0), "1"(n1), "rm"(d));
    return q;
#elif defined(__s390x__) && !defined(__clang__)
    /* Need to use a TImode type to get an even register pair for DLGR.  */
    unsigned __int128 n = (unsigned __int128)n1 << 64 | n0;
    __asm__("dlgr %0, %1" : "+r"(n) : "r"(d));
    *r = n >> 64;
    return n;
#elif defined(_ARCH_PPC64) && defined(_ARCH_PWR7)
    /* From Power ISA 2.06, programming note for divdeu.  */
    uint64_t q1, q2, Q, r1, r2, R;
    __asm__("divdeu %0,%2,%4; divdu %1,%3,%4"
            : "=&r"(q1), "=r"(q2)
            : "r"(n1), "r"(n0), "r"(d));
    r1 = -(q1 * d);         /* low part of (n1<<64) - (q1 * d) */
    r2 = n0 - (q2 * d);
    Q = q1 + q2;
    R = r1 + r2;
    if (R >= d || R < r2) { /* overflow implies R > d */
        Q += 1;
        R -= d;
    }
    *r = R;
    return Q;
#else
    uint64_t d0, d1, q0, q1, r1, r0, m;

    /* Split the divisor into 32-bit halves. */
    d0 = (uint32_t)d;
    d1 = d >> 32;

    /* Upper 32-bit quotient digit: estimate from d1, then correct. */
    r1 = n1 % d1;
    q1 = n1 / d1;
    m = q1 * d0;
    r1 = (r1 << 32) | (n0 >> 32);
    if (r1 < m) {
        q1 -= 1;
        r1 += d;
        if (r1 >= d) {
            if (r1 < m) {
                q1 -= 1;
                r1 += d;
            }
        }
    }
    r1 -= m;

    /* Lower 32-bit quotient digit, same scheme on the partial remainder. */
    r0 = r1 % d1;
    q0 = r1 / d1;
    m = q0 * d0;
    r0 = (r0 << 32) | (uint32_t)n0;
    if (r0 < m) {
        q0 -= 1;
        r0 += d;
        if (r0 >= d) {
            if (r0 < m) {
                q0 -= 1;
                r0 += d;
            }
        }
    }
    r0 -= m;

    *r = r0;
    return (q1 << 32) | q0;
#endif
}
				815
Paolo Bonzini	cb9c377	2012-12-06 12:15:58 +0100	[diff] [blame]	816	#endif