195 lines
4.6 KiB
C
195 lines
4.6 KiB
C
/////////////////////////////////////////////////////////////////////////
|
|
// $Id$
|
|
/////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// Copyright (c) 2014 Stanislav Shwartsman
|
|
// Written by Stanislav Shwartsman [sshwarts at sourceforge net]
|
|
//
|
|
// This library is free software; you can redistribute it and/or
|
|
// modify it under the terms of the GNU Lesser General Public
|
|
// License as published by the Free Software Foundation; either
|
|
// version 2 of the License, or (at your option) any later version.
|
|
//
|
|
// This library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
// Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public
|
|
// License along with this library; if not, write to the Free Software
|
|
// Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA B 02110-1301 USA
|
|
//
|
|
/////////////////////////////////////////////////////////////////////////
|
|
|
|
#ifndef BX_SCALAR_ARITH_FUNCTIONS_H
|
|
#define BX_SCALAR_ARITH_FUNCTIONS_H
|
|
|
|
// parity
|
|
|
|
BX_CPP_INLINE unsigned parity_byte(Bit8u val_8)
|
|
{
|
|
return (0x9669 >> ((val_8 ^ (val_8 >> 4)) & 0xF)) & 1;
|
|
}
|
|
|
|
// tzcnt
|
|
|
|
BX_CPP_INLINE unsigned tzcntw(Bit16u val_16)
|
|
{
|
|
Bit16u mask = 0x1;
|
|
unsigned count = 0;
|
|
|
|
while ((val_16 & mask) == 0 && mask) {
|
|
mask <<= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned tzcntd(Bit32u val_32)
|
|
{
|
|
Bit32u mask = 0x1;
|
|
unsigned count = 0;
|
|
|
|
while ((val_32 & mask) == 0 && mask) {
|
|
mask <<= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned tzcntq(Bit64u val_64)
|
|
{
|
|
Bit64u mask = 0x1;
|
|
unsigned count = 0;
|
|
|
|
while ((val_64 & mask) == 0 && mask) {
|
|
mask <<= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
// lzcnt
|
|
|
|
BX_CPP_INLINE unsigned lzcntw(Bit16u val_16)
|
|
{
|
|
Bit16u mask = 0x8000;
|
|
unsigned count = 0;
|
|
|
|
while ((val_16 & mask) == 0 && mask) {
|
|
mask >>= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned lzcntd(Bit32u val_32)
|
|
{
|
|
Bit32u mask = 0x80000000;
|
|
unsigned count = 0;
|
|
|
|
while ((val_32 & mask) == 0 && mask) {
|
|
mask >>= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned lzcntq(Bit64u val_64)
|
|
{
|
|
Bit64u mask = BX_CONST64(0x8000000000000000);
|
|
unsigned count = 0;
|
|
|
|
while ((val_64 & mask) == 0 && mask) {
|
|
mask >>= 1;
|
|
count++;
|
|
}
|
|
|
|
return count;
|
|
}
|
|
|
|
// popcnt
|
|
|
|
BX_CPP_INLINE unsigned popcntb(Bit8u val_8)
|
|
{
|
|
val_8 = ((val_8>>1) & 0x55) + (val_8 & 0x55);
|
|
val_8 = ((val_8>>2) & 0x33) + (val_8 & 0x33);
|
|
val_8 = ((val_8>>4) & 0x0F) + (val_8 & 0x0F);
|
|
|
|
return val_8;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned popcntw(Bit16u val_16)
|
|
{
|
|
val_16 = ((val_16>>1) & 0x5555) + (val_16 & 0x5555);
|
|
val_16 = ((val_16>>2) & 0x3333) + (val_16 & 0x3333);
|
|
val_16 = ((val_16>>4) & 0x0F0F) + (val_16 & 0x0F0F);
|
|
val_16 = ((val_16>>8) & 0x00FF) + (val_16 & 0x00FF);
|
|
|
|
return val_16;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned popcntd(Bit32u val_32)
|
|
{
|
|
val_32 = ((val_32 >> 1) & 0x55555555) + (val_32 & 0x55555555);
|
|
val_32 = ((val_32 >> 2) & 0x33333333) + (val_32 & 0x33333333);
|
|
val_32 = ((val_32 >> 4) & 0x0F0F0F0F) + (val_32 & 0x0F0F0F0F);
|
|
val_32 = ((val_32 >> 8) & 0x00FF00FF) + (val_32 & 0x00FF00FF);
|
|
val_32 = ((val_32 >> 16) & 0x0000FFFF) + (val_32 & 0x0000FFFF);
|
|
|
|
return val_32;
|
|
}
|
|
|
|
BX_CPP_INLINE unsigned popcntq(Bit64u val_64)
|
|
{
|
|
val_64 = ((val_64 >> 1) & BX_CONST64(0x5555555555555555)) + (val_64 & BX_CONST64(0x5555555555555555));
|
|
val_64 = ((val_64 >> 2) & BX_CONST64(0x3333333333333333)) + (val_64 & BX_CONST64(0x3333333333333333));
|
|
val_64 = ((val_64 >> 4) & BX_CONST64(0x0F0F0F0F0F0F0F0F)) + (val_64 & BX_CONST64(0x0F0F0F0F0F0F0F0F));
|
|
val_64 = ((val_64 >> 8) & BX_CONST64(0x00FF00FF00FF00FF)) + (val_64 & BX_CONST64(0x00FF00FF00FF00FF));
|
|
val_64 = ((val_64 >> 16) & BX_CONST64(0x0000FFFF0000FFFF)) + (val_64 & BX_CONST64(0x0000FFFF0000FFFF));
|
|
val_64 = ((val_64 >> 32) & BX_CONST64(0x00000000FFFFFFFF)) + (val_64 & BX_CONST64(0x00000000FFFFFFFF));
|
|
|
|
return val_64;
|
|
}
|
|
|
|
// bit extract
|
|
|
|
BX_CPP_INLINE Bit32u bextrd(Bit32u val_32, unsigned start, unsigned len)
|
|
{
|
|
Bit32u result = 0;
|
|
|
|
if (start < 32 && len > 0) {
|
|
result = val_32 >> start;
|
|
|
|
if (len < 32) {
|
|
Bit32u extract_mask = (1 << len) - 1;
|
|
result &= extract_mask;
|
|
}
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
BX_CPP_INLINE Bit64u bextrq(Bit64u val_64, unsigned start, unsigned len)
|
|
{
|
|
Bit64u result = 0;
|
|
|
|
if (start < 64 && len > 0) {
|
|
result = val_64 >> start;
|
|
|
|
if (len < 64) {
|
|
Bit64u extract_mask = (BX_CONST64(1) << len) - 1;
|
|
result &= extract_mask;
|
|
}
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
#endif
|