bgfx/src/vertexdecl.cpp
Branimir Karadžić f1a8c5f195 Cleanup.
2016-09-27 22:07:53 -07:00

861 lines
20 KiB
C++

/*
* Copyright 2011-2016 Branimir Karadzic. All rights reserved.
* License: https://github.com/bkaradzic/bgfx#license-bsd-2-clause
*/
#include <stdarg.h>
#include <string.h>
#include <bx/debug.h>
#include <bx/hash.h>
#include <bx/readerwriter.h>
#include <bx/radixsort.h>
#include <bx/string.h>
#include <bx/uint32_t.h>
#include "config.h"
#include "vertexdecl.h"
namespace bgfx
{
// Per-attribute size table referenced by the Null, Direct3D9 and Count
// slots of s_attribTypeSize. Rows follow the attribute type (see the row
// comments), columns are indexed by component count minus one. Values are
// added to the vertex stride by VertexDecl::add(). Every entry in this
// table is a multiple of four.
static const uint8_t s_attribTypeSizeDx9[AttribType::Count][4] =
{
{ 4, 4, 4, 4 }, // Uint8
{ 4, 4, 4, 4 }, // Uint10
{ 4, 4, 8, 8 }, // Int16
{ 4, 4, 8, 8 }, // Half
{ 4, 8, 12, 16 }, // Float
};
// Per-attribute size table referenced by the Direct3D11 and Direct3D12
// slots of s_attribTypeSize. Rows follow the attribute type (see the row
// comments), columns are indexed by component count minus one. Values are
// added to the vertex stride by VertexDecl::add(). Three-component Uint8,
// Int16 and Half attributes take the same size as four-component ones.
static const uint8_t s_attribTypeSizeDx1x[AttribType::Count][4] =
{
{ 1, 2, 4, 4 }, // Uint8
{ 4, 4, 4, 4 }, // Uint10
{ 2, 4, 8, 8 }, // Int16
{ 2, 4, 8, 8 }, // Half
{ 4, 8, 12, 16 }, // Float
};
// Per-attribute size table referenced by the Gnm, Metal, OpenGLES, OpenGL
// and Vulkan slots of s_attribTypeSize. Rows follow the attribute type (see
// the row comments), columns are indexed by component count minus one.
// Values are added to the vertex stride by VertexDecl::add(). Unlike the
// other tables, three-component Int16 and Half attributes are 6 here.
static const uint8_t s_attribTypeSizeGl[AttribType::Count][4] =
{
{ 1, 2, 4, 4 }, // Uint8
{ 4, 4, 4, 4 }, // Uint10
{ 2, 4, 6, 8 }, // Int16
{ 2, 4, 6, 8 }, // Half
{ 4, 8, 12, 16 }, // Float
};
// Size table selector: one pointer per renderer type plus one extra slot at
// index RendererType::Count. The first slot (Null) and the last slot (Count)
// start out pointing at the Dx9 table and are both overwritten by
// initAttribTypeSizeTable(). The array is intentionally not const for that
// reason; the tables it points to are.
static const uint8_t (*s_attribTypeSize[])[AttribType::Count][4] =
{
&s_attribTypeSizeDx9, // Null
&s_attribTypeSizeDx9, // Direct3D9
&s_attribTypeSizeDx1x, // Direct3D11
&s_attribTypeSizeDx1x, // Direct3D12
&s_attribTypeSizeGl, // Gnm
&s_attribTypeSizeGl, // Metal
&s_attribTypeSizeGl, // OpenGLES
&s_attribTypeSizeGl, // OpenGL
&s_attribTypeSizeGl, // Vulkan
&s_attribTypeSizeDx9, // Count
};
// Keeps the selector in sync with RendererType::Enum (plus the Count slot).
BX_STATIC_ASSERT(BX_COUNTOF(s_attribTypeSize) == RendererType::Count+1);
/// Points the two renderer-independent slots of s_attribTypeSize (index 0
/// and index RendererType::Count) at the size table registered for `_type`.
///
/// @param _type Renderer whose attribute size table becomes the default.
void initAttribTypeSizeTable(RendererType::Enum _type)
{
	const uint8_t (*selected)[AttribType::Count][4] = s_attribTypeSize[_type];

	s_attribTypeSize[0]                   = selected;
	s_attribTypeSize[RendererType::Count] = selected;
}
/// Formats a printf-style message and forwards it to bx::debugOutput().
///
/// The message is first formatted into an 8 KiB stack buffer. If that is too
/// small, a buffer of the exact required size is taken from the stack with
/// alloca() and the message is formatted a second time.
///
/// @param _format printf-style format string.
/// @param _argList Arguments for `_format`. As with vsnprintf, the list is
///   consumed; the caller is still responsible for va_end().
void dbgPrintfVargs(const char* _format, va_list _argList)
{
	char temp[8192];
	char* out = temp;
	int32_t capacity = (int32_t)sizeof(temp);

	// A va_list may only be traversed once, so keep a pristine copy for the
	// potential second formatting pass.
	va_list argListCopy;
	va_copy(argListCopy, _argList);

	// Assumes bx::vsnprintf follows C99 vsnprintf: it returns the length the
	// full output would have (excluding the terminator), or a negative value
	// on error.
	int32_t len = bx::vsnprintf(out, capacity, _format, _argList);

	// len == capacity already means truncation: the terminator did not fit.
	if (capacity <= len)
	{
		capacity = len+1;
		out = (char*)alloca(capacity);
		len = bx::vsnprintf(out, capacity, _format, argListCopy);
	}

	va_end(argListCopy);

	// Never index outside of the buffer, whatever the formatter reported.
	if (len < 0)
	{
		len = 0;
	}
	else if (len >= capacity)
	{
		len = capacity-1;
	}

	out[len] = '\0';
	bx::debugOutput(out);
}
/// Variadic front end for dbgPrintfVargs(): collects the arguments that
/// follow `_format` and hands them over as a va_list.
///
/// @param _format printf-style format string.
void dbgPrintf(const char* _format, ...)
{
	va_list args;
	va_start(args, _format);

	dbgPrintfVargs(_format, args);

	va_end(args);
}
// Intentionally empty, user-provided constructor; no member is initialized
// here. begin() is what resets the declaration.
VertexDecl::VertexDecl()
{
// BK - the struct needs a user-provided ctor so that it qualifies as non-POD.
// This is needed to catch programming errors when serializing the struct.
}
/// Resets the declaration so attributes can be added.
///
/// All attribute slots are filled with 0xff bytes (UINT16_MAX marks an unused
/// slot), all offsets and the stride are zeroed. Until end() is called,
/// m_hash does not hold a hash: it temporarily stores the renderer type that
/// add() uses to pick the attribute size table.
///
/// @param _renderer Renderer type whose size table is used while building.
/// @returns *this, to allow call chaining.
VertexDecl& VertexDecl::begin(RendererType::Enum _renderer)
{
	memset(m_offset, 0, sizeof(m_offset) );
	memset(m_attributes, 0xff, sizeof(m_attributes) );
	m_stride = 0;

	// Borrow the hash field for the renderer type while building.
	m_hash = _renderer;

	return *this;
}
void VertexDecl::end()
{
bx::HashMurmur2A murmur;
murmur.begin();
murmur.add(m_attributes, sizeof(m_attributes) );
murmur.add(m_offset, sizeof(m_offset) );
murmur.add(m_stride);
m_hash = murmur.end();
}
// Adds attribute `_attrib` at the current end of the vertex and grows the
// stride by the size of the attribute.
//
// _attrib     - attribute slot to fill.
// _num        - number of components; used as `_num-1` to index the size
//               table, so it is expected to be in the range 1..4.
// _type       - component type.
// _normalized - stored in the encoded attribute (bit 7).
// _asInt      - stored in the encoded attribute (bit 8), but only for the
//               first three attribute types.
//
// Returns *this, to allow call chaining. Must be called between begin() and
// end(), because m_hash is read as the renderer type here.
VertexDecl& VertexDecl::add(Attrib::Enum _attrib, uint8_t _num, AttribType::Enum _type, bool _normalized, bool _asInt)
{
// Encoded layout: bits 0-1 = component count minus one, bits 3-5 = type,
// bit 7 = normalized, bit 8 = as-int. decode() reverses this.
const uint16_t encodedNorm = (_normalized&1)<<7;
const uint16_t encodedType = (_type&7)<<3;
const uint16_t encodedNum = (_num-1)&3;
// The string literal is a lookup table indexed by type: 1 for the first
// three types (Uint8, Uint10, Int16 in the size tables' row order), 0 for
// the remaining ones, which therefore never keep the as-int flag.
const uint16_t encodeAsInt = (_asInt&(!!"\x1\x1\x1\x0\x0"[_type]) )<<8;
m_attributes[_attrib] = encodedNorm|encodedType|encodedNum|encodeAsInt;
// The attribute starts where the vertex currently ends.
m_offset[_attrib] = m_stride;
// m_hash holds the renderer type set by begin() and selects the size table.
m_stride += (*s_attribTypeSize[m_hash])[_type][_num-1];
return *this;
}
// Grows the stride by `_num` without registering an attribute, so the next
// attribute added starts `_num` further into the vertex.
// Returns *this, to allow call chaining.
VertexDecl& VertexDecl::skip(uint8_t _num)
{
m_stride += _num;
return *this;
}
/// Unpacks the encoded description of `_attrib` as stored by add().
///
/// @param _attrib Attribute slot to decode.
/// @param[out] _num Component count, always in the range 1..4.
/// @param[out] _type Component type (bits 3-5 of the encoded value).
/// @param[out] _normalized State of bit 7 of the encoded value.
/// @param[out] _asInt State of bit 8 of the encoded value.
void VertexDecl::decode(Attrib::Enum _attrib, uint8_t& _num, AttribType::Enum& _type, bool& _normalized, bool& _asInt) const
{
	const uint16_t encoded = m_attributes[_attrib];

	const uint16_t numBits  = encoded & 3;
	const uint16_t typeBits = (encoded >> 3) & 7;
	const uint16_t normBit  = encoded & (1<<7);
	const uint16_t intBit   = encoded & (1<<8);

	_num        = uint8_t(numBits + 1);
	_type       = AttribType::Enum(typeBits);
	_normalized = 0 != normBit;
	_asInt      = 0 != intBit;
}
// Human readable attribute names used for debug output. The entries are
// indexed by attribute value, so their order must match the attribute
// enumeration, and each string spells the corresponding enumerator.
static const char* s_attrName[] =
{
	"Attrib::Position",
	"Attrib::Normal",
	"Attrib::Tangent",
	"Attrib::Bitangent",
	"Attrib::Color0",
	"Attrib::Color1",
	"Attrib::Indices",
	"Attrib::Weight", // was "Attrib::Weights", which is not the enumerator's name
	"Attrib::TexCoord0",
	"Attrib::TexCoord1",
	"Attrib::TexCoord2",
	"Attrib::TexCoord3",
	"Attrib::TexCoord4",
	"Attrib::TexCoord5",
	"Attrib::TexCoord6",
	"Attrib::TexCoord7",
};
// The name table must have exactly one entry per attribute.
BX_STATIC_ASSERT(BX_COUNTOF(s_attrName) == Attrib::Count);
// Returns the debug name of `_attr`.
// The value is used directly as an index into s_attrName without a range
// check, so `_attr` must be a real attribute (not Attrib::Count).
const char* getAttribName(Attrib::Enum _attr)
{
return s_attrName[_attr];
}
void dump(const VertexDecl& _decl)
{
if (BX_ENABLED(BGFX_CONFIG_DEBUG) )
{
dbgPrintf("vertexdecl %08x (%08x), stride %d\n"
, _decl.m_hash
, bx::hashMurmur2A(_decl.m_attributes)
, _decl.m_stride
);
for (uint32_t attr = 0; attr < Attrib::Count; ++attr)
{
if (UINT16_MAX != _decl.m_attributes[attr])
{
uint8_t num;
AttribType::Enum type;
bool normalized;
bool asInt;
_decl.decode(Attrib::Enum(attr), num, type, normalized, asInt);
dbgPrintf("\tattr %d - %s, num %d, type %d, norm %d, asint %d, offset %d\n"
, attr
, getAttribName(Attrib::Enum(attr) )
, num
, type
, normalized
, asInt
, _decl.m_offset[attr]
);
}
}
}
}
// Pairs an attribute with the 16-bit id that write() stores for it and that
// read() maps back to the attribute.
struct AttribToId
{
Attrib::Enum attr; // attribute enumerator
uint16_t id; // id used in the serialized form
};
// Attribute <-> serialized id mapping. The table is indexed directly by
// attribute value in attribToId() and write(), and searched linearly by id
// in idToAttrib().
static AttribToId s_attribToId[] =
{
// NOTICE:
// Entries must be listed in the same order as the attributes appear in
// Attrib::Enum! Each id is unique and must not be changed when new
// attributes are added.
{ Attrib::Position, 0x0001 },
{ Attrib::Normal, 0x0002 },
{ Attrib::Tangent, 0x0003 },
{ Attrib::Bitangent, 0x0004 },
{ Attrib::Color0, 0x0005 },
{ Attrib::Color1, 0x0006 },
{ Attrib::Indices, 0x000e },
{ Attrib::Weight, 0x000f },
{ Attrib::TexCoord0, 0x0010 },
{ Attrib::TexCoord1, 0x0011 },
{ Attrib::TexCoord2, 0x0012 },
{ Attrib::TexCoord3, 0x0013 },
{ Attrib::TexCoord4, 0x0014 },
{ Attrib::TexCoord5, 0x0015 },
{ Attrib::TexCoord6, 0x0016 },
{ Attrib::TexCoord7, 0x0017 },
};
// The mapping must have exactly one entry per attribute.
BX_STATIC_ASSERT(BX_COUNTOF(s_attribToId) == Attrib::Count);
/// Looks up the attribute that is registered under serialized id `id`.
///
/// @param id Serialized attribute id.
/// @returns The matching attribute, or Attrib::Count when no entry of
///   s_attribToId carries that id.
Attrib::Enum idToAttrib(uint16_t id)
{
	const AttribToId* const tableEnd = s_attribToId + BX_COUNTOF(s_attribToId);

	for (const AttribToId* entry = s_attribToId; entry != tableEnd; ++entry)
	{
		if (id == entry->id)
		{
			return entry->attr;
		}
	}

	return Attrib::Count;
}
/// Returns the serialized id of `_attr`.
///
/// `_attr` is used directly as an index into s_attribToId without a range
/// check.
uint16_t attribToId(Attrib::Enum _attr)
{
	const AttribToId& entry = s_attribToId[_attr];
	return entry.id;
}
// Pairs an attribute type with the 16-bit id that write() stores for it and
// that read() maps back to the attribute type.
struct AttribTypeToId
{
AttribType::Enum type; // attribute type enumerator
uint16_t id; // id used in the serialized form
};
// Attribute type <-> serialized id mapping. The table is indexed directly by
// attribute type value in attribTypeToId() and write(), and searched
// linearly by id in idToAttribType(). Note that the ids are not in ascending
// order: Uint10 carries 0x0005.
static AttribTypeToId s_attribTypeToId[] =
{
// NOTICE:
// Entries must be listed in the same order as the types appear in
// AttribType::Enum! Each id is unique and must not be changed when new
// attribute types are added.
{ AttribType::Uint8, 0x0001 },
{ AttribType::Uint10, 0x0005 },
{ AttribType::Int16, 0x0002 },
{ AttribType::Half, 0x0003 },
{ AttribType::Float, 0x0004 },
};
// The mapping must have exactly one entry per attribute type.
BX_STATIC_ASSERT(BX_COUNTOF(s_attribTypeToId) == AttribType::Count);
/// Looks up the attribute type that is registered under serialized id `id`.
///
/// @param id Serialized attribute type id.
/// @returns The matching attribute type, or AttribType::Count when no entry
///   of s_attribTypeToId carries that id.
AttribType::Enum idToAttribType(uint16_t id)
{
	const AttribTypeToId* const tableEnd = s_attribTypeToId + BX_COUNTOF(s_attribTypeToId);

	for (const AttribTypeToId* entry = s_attribTypeToId; entry != tableEnd; ++entry)
	{
		if (id == entry->id)
		{
			return entry->type;
		}
	}

	return AttribType::Count;
}
/// Returns the serialized id of attribute type `_attr`.
///
/// `_attr` is used directly as an index into s_attribTypeToId without a
/// range check.
uint16_t attribTypeToId(AttribType::Enum _attr)
{
	const AttribTypeToId& entry = s_attribTypeToId[_attr];
	return entry.id;
}
/// Serializes `_decl` to `_writer`.
///
/// Output order: number of present attributes (uint8_t), stride, then for
/// every present attribute its offset, attribute id, component count,
/// attribute type id, normalized flag and as-int flag.
///
/// @param _writer Destination writer.
/// @param _decl Declaration to serialize.
/// @param _err Error object handed to every bx::write() call.
/// @returns Sum of the values returned by the bx::write() calls.
int32_t write(bx::WriterI* _writer, const VertexDecl& _decl, bx::Error* _err)
{
	BX_ERROR_SCOPE(_err);

	// First pass: count the slots that are in use (UINT16_MAX == unused).
	uint8_t numAttrs = 0;
	for (uint32_t slot = 0; slot < Attrib::Count; ++slot)
	{
		if (UINT16_MAX != _decl.m_attributes[slot])
		{
			++numAttrs;
		}
	}

	int32_t total = 0;
	total += bx::write(_writer, numAttrs, _err);
	total += bx::write(_writer, _decl.m_stride, _err);

	// Second pass: emit one record per used slot.
	for (uint32_t slot = 0; slot < Attrib::Count; ++slot)
	{
		if (UINT16_MAX == _decl.m_attributes[slot])
		{
			continue;
		}

		uint8_t num;
		AttribType::Enum type;
		bool normalized;
		bool asInt;
		_decl.decode(Attrib::Enum(slot), num, type, normalized, asInt);

		total += bx::write(_writer, _decl.m_offset[slot], _err);
		total += bx::write(_writer, s_attribToId[slot].id, _err);
		total += bx::write(_writer, num, _err);
		total += bx::write(_writer, s_attribTypeToId[type].id, _err);
		total += bx::write(_writer, normalized, _err);
		total += bx::write(_writer, asInt, _err);
	}

	return total;
}
/// Deserializes a vertex declaration from `_reader` into `_decl`.
///
/// Input order: attribute count (uint8_t), stride (uint16_t), then per
/// attribute: offset (uint16_t), attribute id (uint16_t), component count
/// (uint8_t), attribute type id (uint16_t), normalized flag, as-int flag.
///
/// Records that cannot be represented are skipped rather than treated as an
/// error: unknown attribute ids, unknown attribute type ids and component
/// counts outside 1..4. The latter would otherwise make VertexDecl::add()
/// index its size table out of range.
///
/// The hash is computed by end() before the serialized stride is assigned,
/// so it covers the stride accumulated by add(), not the serialized one.
///
/// @param _reader Source reader.
/// @param _decl Declaration to fill. It is left untouched if the header
///   cannot be read, and left in the state between begin() and end() if a
///   record cannot be read.
/// @param _err Error object handed to every bx::read() call.
/// @returns Sum of the values returned by the bx::read() calls.
int32_t read(bx::ReaderI* _reader, VertexDecl& _decl, bx::Error* _err)
{
	BX_ERROR_SCOPE(_err);

	int32_t total = 0;

	uint8_t numAttrs = 0;
	total += bx::read(_reader, numAttrs, _err);

	uint16_t stride = 0;
	total += bx::read(_reader, stride, _err);

	if (!_err->isOk() )
	{
		return total;
	}

	_decl.begin();

	for (uint32_t ii = 0; ii < numAttrs; ++ii)
	{
		uint16_t offset = 0;
		total += bx::read(_reader, offset, _err);

		uint16_t attribId = 0;
		total += bx::read(_reader, attribId, _err);

		uint8_t num = 0;
		total += bx::read(_reader, num, _err);

		uint16_t attribTypeId = 0;
		total += bx::read(_reader, attribTypeId, _err);

		bool normalized = false;
		total += bx::read(_reader, normalized, _err);

		bool asInt = false;
		total += bx::read(_reader, asInt, _err);

		if (!_err->isOk() )
		{
			return total;
		}

		const Attrib::Enum attr = idToAttrib(attribId);
		const AttribType::Enum type = idToAttribType(attribTypeId);

		// add() indexes its size table with num-1; only 1..4 is in range.
		const bool validNum = 1 <= num && num <= 4;

		if (Attrib::Count != attr
		&&  AttribType::Count != type
		&&  validNum)
		{
			_decl.add(attr, num, type, normalized, asInt);

			// add() placed the attribute at the running stride; restore the
			// offset that was serialized instead.
			_decl.m_offset[attr] = offset;
		}
	}

	_decl.end();
	_decl.m_stride = stride;

	return total;
}
void vertexPack(const float _input[4], bool _inputNormalized, Attrib::Enum _attr, const VertexDecl& _decl, void* _data, uint32_t _index)
{
if (!_decl.has(_attr) )
{
return;
}
uint32_t stride = _decl.getStride();
uint8_t* data = (uint8_t*)_data + _index*stride + _decl.getOffset(_attr);
uint8_t num;
AttribType::Enum type;
bool normalized;
bool asInt;
_decl.decode(_attr, num, type, normalized, asInt);
switch (type)
{
default:
case AttribType::Uint8:
{
uint8_t* packed = (uint8_t*)data;
if (_inputNormalized)
{
if (asInt)
{
switch (num)
{
default: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f);
case 3: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f);
case 2: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f);
case 1: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f);
}
}
else
{
switch (num)
{
default: *packed++ = uint8_t(*_input++ * 255.0f);
case 3: *packed++ = uint8_t(*_input++ * 255.0f);
case 2: *packed++ = uint8_t(*_input++ * 255.0f);
case 1: *packed++ = uint8_t(*_input++ * 255.0f);
}
}
}
else
{
switch (num)
{
default: *packed++ = uint8_t(*_input++);
case 3: *packed++ = uint8_t(*_input++);
case 2: *packed++ = uint8_t(*_input++);
case 1: *packed++ = uint8_t(*_input++);
}
}
}
break;
case AttribType::Uint10:
{
uint32_t packed = 0;
if (_inputNormalized)
{
if (asInt)
{
switch (num)
{
default:
case 3: packed |= uint32_t(*_input++ * 511.0f + 512.0f);
case 2: packed <<= 10; packed |= uint32_t(*_input++ * 511.0f + 512.0f);
case 1: packed <<= 10; packed |= uint32_t(*_input++ * 511.0f + 512.0f);
}
}
else
{
switch (num)
{
default:
case 3: packed |= uint32_t(*_input++ * 1023.0f);
case 2: packed <<= 10; packed |= uint32_t(*_input++ * 1023.0f);
case 1: packed <<= 10; packed |= uint32_t(*_input++ * 1023.0f);
}
}
}
else
{
switch (num)
{
default:
case 3: packed |= uint32_t(*_input++);
case 2: packed <<= 10; packed |= uint32_t(*_input++);
case 1: packed <<= 10; packed |= uint32_t(*_input++);
}
}
*(uint32_t*)data = packed;
}
break;
case AttribType::Int16:
{
int16_t* packed = (int16_t*)data;
if (_inputNormalized)
{
if (asInt)
{
switch (num)
{
default: *packed++ = int16_t(*_input++ * 32767.0f);
case 3: *packed++ = int16_t(*_input++ * 32767.0f);
case 2: *packed++ = int16_t(*_input++ * 32767.0f);
case 1: *packed++ = int16_t(*_input++ * 32767.0f);
}
}
else
{
switch (num)
{
default: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f);
case 3: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f);
case 2: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f);
case 1: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f);
}
}
}
else
{
switch (num)
{
default: *packed++ = int16_t(*_input++);
case 3: *packed++ = int16_t(*_input++);
case 2: *packed++ = int16_t(*_input++);
case 1: *packed++ = int16_t(*_input++);
}
}
}
break;
case AttribType::Half:
{
uint16_t* packed = (uint16_t*)data;
switch (num)
{
default: *packed++ = bx::halfFromFloat(*_input++);
case 3: *packed++ = bx::halfFromFloat(*_input++);
case 2: *packed++ = bx::halfFromFloat(*_input++);
case 1: *packed++ = bx::halfFromFloat(*_input++);
}
}
break;
case AttribType::Float:
memcpy(data, _input, num*sizeof(float) );
break;
}
}
/// Reads attribute `_attr` of vertex `_index` from `_data` and expands it to
/// four floats.
///
/// All four outputs are always written: components that the attribute does
/// not provide are set to 0. That includes the case where `_decl` does not
/// contain `_attr` at all, and the fourth component of a four-component
/// Uint10 attribute, of which only three 10-bit fields are decoded.
///
/// Conversion per storage type:
///  - Uint8:  divided by 255, or (value - 128) / 127 when flagged as-int.
///  - Uint10: divided by 1023, or (value - 512) / 511 when flagged as-int;
///            the first output comes from the lowest 10 bits.
///  - Int16:  (value + 32768) / 65535, or value / 32767 when flagged as-int.
///  - Half:   converted with bx::halfToFloat().
///  - Float:  copied verbatim.
///
/// @param _output Receives the four components.
/// @param _attr Attribute to read.
/// @param _decl Layout of the vertices in `_data`.
/// @param _data Start of the vertex buffer.
/// @param _index Index of the vertex to read.
void vertexUnpack(float _output[4], Attrib::Enum _attr, const VertexDecl& _decl, const void* _data, uint32_t _index)
{
	if (!_decl.has(_attr) )
	{
		memset(_output, 0, 4*sizeof(float) );
		return;
	}

	uint32_t stride = _decl.getStride();
	const uint8_t* data = (const uint8_t*)_data + _index*stride + _decl.getOffset(_attr);

	uint8_t num;
	AttribType::Enum type;
	bool normalized;
	bool asInt;
	_decl.decode(_attr, num, type, normalized, asInt);

	// Element-wise formats hold 1, 2 or 3 components as declared and four
	// components for any other count.
	const uint32_t count = (1 <= num && num <= 3) ? num : 4;

	// Number of outputs produced so far; drives the zero fill at the end.
	uint32_t written = 0;

	switch (type)
	{
	default:
	case AttribType::Uint8:
		{
			const uint8_t* packed = (const uint8_t*)data;
			for (; written < count; ++written)
			{
				const float value = float(packed[written]);
				_output[written] = asInt
					? (value - 128.0f)*1.0f/127.0f
					: value*1.0f/255.0f
					;
			}
		}
		break;

	case AttribType::Uint10:
		{
			// Only three 10-bit fields are decoded from the 32-bit word.
			const uint32_t fields = count < 3 ? count : 3;

			uint32_t packed = *(const uint32_t*)data;
			for (; written < fields; ++written)
			{
				const float value = float(packed & 0x3ff);
				_output[written] = asInt
					? (value - 512.0f)*1.0f/511.0f
					: value*1.0f/1023.0f
					;
				packed >>= 10;
			}
		}
		break;

	case AttribType::Int16:
		{
			const int16_t* packed = (const int16_t*)data;
			for (; written < count; ++written)
			{
				const float value = float(packed[written]);
				_output[written] = asInt
					? value*1.0f/32767.0f
					: (value + 32768.0f)*1.0f/65535.0f
					;
			}
		}
		break;

	case AttribType::Half:
		{
			const uint16_t* packed = (const uint16_t*)data;
			for (; written < count; ++written)
			{
				_output[written] = bx::halfToFloat(packed[written]);
			}
		}
		break;

	case AttribType::Float:
		memcpy(_output, data, num*sizeof(float) );
		written = num;
		break;
	}

	// Zero whatever was not decoded, so no output is left uninitialized.
	for (; written < 4; ++written)
	{
		_output[written] = 0.0f;
	}
}
void vertexConvert(const VertexDecl& _destDecl, void* _destData, const VertexDecl& _srcDecl, const void* _srcData, uint32_t _num)
{
if (_destDecl.m_hash == _srcDecl.m_hash)
{
memcpy(_destData, _srcData, _srcDecl.getSize(_num) );
return;
}
struct ConvertOp
{
enum Enum
{
Set,
Copy,
Convert,
};
Attrib::Enum attr;
Enum op;
uint32_t src;
uint32_t dest;
uint32_t size;
};
ConvertOp convertOp[Attrib::Count];
uint32_t numOps = 0;
for (uint32_t ii = 0; ii < Attrib::Count; ++ii)
{
Attrib::Enum attr = (Attrib::Enum)ii;
if (_destDecl.has(attr) )
{
ConvertOp& cop = convertOp[numOps];
cop.attr = attr;
cop.dest = _destDecl.getOffset(attr);
uint8_t num;
AttribType::Enum type;
bool normalized;
bool asInt;
_destDecl.decode(attr, num, type, normalized, asInt);
cop.size = (*s_attribTypeSize[0])[type][num-1];
if (_srcDecl.has(attr) )
{
cop.src = _srcDecl.getOffset(attr);
cop.op = _destDecl.m_attributes[attr] == _srcDecl.m_attributes[attr] ? ConvertOp::Copy : ConvertOp::Convert;
}
else
{
cop.op = ConvertOp::Set;
}
++numOps;
}
}
if (0 < numOps)
{
const uint8_t* src = (const uint8_t*)_srcData;
uint32_t srcStride = _srcDecl.getStride();
uint8_t* dest = (uint8_t*)_destData;
uint32_t destStride = _destDecl.getStride();
float unpacked[4];
for (uint32_t ii = 0; ii < _num; ++ii)
{
for (uint32_t jj = 0; jj < numOps; ++jj)
{
const ConvertOp& cop = convertOp[jj];
switch (cop.op)
{
case ConvertOp::Set:
memset(dest + cop.dest, 0, cop.size);
break;
case ConvertOp::Copy:
memcpy(dest + cop.dest, src + cop.src, cop.size);
break;
case ConvertOp::Convert:
vertexUnpack(unpacked, cop.attr, _srcDecl, src);
vertexPack(unpacked, true, cop.attr, _destDecl, dest);
break;
}
}
src += srcStride;
dest += destStride;
}
}
}
/// Returns the squared Euclidean distance between the 3D points `_a` and
/// `_b`.
inline float sqLength(const float _a[3], const float _b[3])
{
	const float dx = _a[0] - _b[0];
	const float dy = _a[1] - _b[1];
	const float dz = _a[2] - _b[2];

	return dx*dx + dy*dy + dz*dz;
}
/// Brute force reference implementation of vertex welding.
///
/// Every vertex is compared against every other vertex. A vertex that has
/// not been assigned yet becomes a representative, and every unassigned
/// vertex whose position lies closer than `_epsilon` to it is mapped to it.
///
/// @param _output Receives, for each of the `_num` vertices, the index of
///   the vertex that represents it.
/// @param _decl Layout of the vertices in `_data`.
/// @param _data Vertex buffer.
/// @param _num Number of vertices.
/// @param _epsilon Welding distance.
/// @returns Number of representatives, i.e. vertices left after welding.
uint16_t weldVerticesRef(uint16_t* _output, const VertexDecl& _decl, const void* _data, uint16_t _num, float _epsilon)
{
	const float maxDistSq = _epsilon*_epsilon;
	uint32_t uniqueCount = 0;

	// UINT16_MAX marks a vertex that has not been assigned yet.
	memset(_output, 0xff, _num*sizeof(uint16_t) );

	for (uint32_t base = 0; base < _num; ++base)
	{
		if (UINT16_MAX == _output[base])
		{
			_output[base] = (uint16_t)base;
			++uniqueCount;

			float basePos[4];
			vertexUnpack(basePos, Attrib::Position, _decl, _data, base);

			for (uint32_t other = 0; other < _num; ++other)
			{
				if (UINT16_MAX == _output[other])
				{
					float otherPos[4];
					vertexUnpack(otherPos, Attrib::Position, _decl, _data, other);

					if (sqLength(otherPos, basePos) < maxDistSq)
					{
						_output[other] = (uint16_t)base;
					}
				}
			}
		}
	}

	return (uint16_t)uniqueCount;
}
/// Welds vertices using a hash table keyed on the vertex position.
///
/// Positions are hashed with Murmur2A into a table of
/// bx::uint32_nextpow2(_num) buckets; each bucket is a chain of vertex
/// indices linked through a `next` array. A vertex is only compared against
/// the vertices in its own bucket, and is mapped to the first one that lies
/// closer than `_epsilon`. Both arrays are taken from the stack with
/// alloca().
///
/// @param _output Receives, for each of the `_num` vertices, the index of
///   the vertex that represents it.
/// @param _decl Layout of the vertices in `_data`.
/// @param _data Vertex buffer.
/// @param _num Number of vertices.
/// @param _epsilon Welding distance.
/// @returns Number of representatives, i.e. vertices left after welding.
uint16_t weldVertices(uint16_t* _output, const VertexDecl& _decl, const void* _data, uint16_t _num, float _epsilon)
{
	const uint32_t bucketCount = bx::uint32_nextpow2(_num);
	const uint32_t bucketMask  = bucketCount-1;
	const float maxDistSq = _epsilon*_epsilon;

	// One allocation holds the bucket heads followed by the chain links;
	// UINT16_MAX terminates a chain / marks an empty bucket.
	const uint32_t size = sizeof(uint16_t)*(bucketCount + _num);
	uint16_t* buckets = (uint16_t*)alloca(size);
	memset(buckets, 0xff, size);
	uint16_t* next = buckets + bucketCount;

	uint32_t uniqueCount = 0;

	for (uint32_t ii = 0; ii < _num; ++ii)
	{
		float pos[4];
		vertexUnpack(pos, Attrib::Position, _decl, _data, ii);

		const uint32_t bucket = bx::hashMurmur2A(pos, 3*sizeof(float) ) & bucketMask;

		// Walk the chain until a close enough vertex or the end is found.
		uint16_t candidate = buckets[bucket];
		while (UINT16_MAX != candidate)
		{
			float other[4];
			vertexUnpack(other, Attrib::Position, _decl, _data, _output[candidate]);

			if (sqLength(other, pos) < maxDistSq)
			{
				break;
			}

			candidate = next[candidate];
		}

		if (UINT16_MAX != candidate)
		{
			_output[ii] = _output[candidate];
			continue;
		}

		// No match: the vertex represents itself and heads its bucket.
		_output[ii] = (uint16_t)ii;
		next[ii] = buckets[bucket];
		buckets[bucket] = (uint16_t)ii;
		uniqueCount++;
	}

	return (uint16_t)uniqueCount;
}
} // namespace bgfx