/* * Copyright 2011-2015 Branimir Karadzic. All rights reserved. * License: http://www.opensource.org/licenses/BSD-2-Clause */ #include #include #include #include #include #include #include "config.h" #include "vertexdecl.h" namespace bgfx { static const uint8_t s_attribTypeSizeDx9[AttribType::Count][4] = { { 4, 4, 4, 4 }, { 4, 4, 8, 8 }, { 4, 4, 8, 8 }, { 4, 8, 12, 16 }, }; static const uint8_t s_attribTypeSizeDx1x[AttribType::Count][4] = { { 1, 2, 4, 4 }, { 2, 4, 8, 8 }, { 2, 4, 8, 8 }, { 4, 8, 12, 16 }, }; static const uint8_t s_attribTypeSizeGl[AttribType::Count][4] = { { 1, 2, 4, 4 }, { 2, 4, 6, 8 }, { 2, 4, 6, 8 }, { 4, 8, 12, 16 }, }; static const uint8_t (*s_attribTypeSize[])[AttribType::Count][4] = { &s_attribTypeSizeDx9, // Null &s_attribTypeSizeDx9, // Direct3D9 &s_attribTypeSizeDx1x, // Direct3D11 &s_attribTypeSizeDx1x, // Direct3D12 &s_attribTypeSizeGl, // OpenGLES &s_attribTypeSizeGl, // OpenGL &s_attribTypeSizeGl, // Vulkan &s_attribTypeSizeDx9, // Count }; BX_STATIC_ASSERT(BX_COUNTOF(s_attribTypeSize) == RendererType::Count+1); void initAttribTypeSizeTable(RendererType::Enum _type) { s_attribTypeSize[0] = s_attribTypeSize[_type]; s_attribTypeSize[RendererType::Count] = s_attribTypeSize[_type]; } void dbgPrintfVargs(const char* _format, va_list _argList) { char temp[8192]; char* out = temp; int32_t len = bx::vsnprintf(out, sizeof(temp), _format, _argList); if ( (int32_t)sizeof(temp) < len) { out = (char*)alloca(len+1); len = bx::vsnprintf(out, len, _format, _argList); } out[len] = '\0'; bx::debugOutput(out); } void dbgPrintf(const char* _format, ...) { va_list argList; va_start(argList, _format); dbgPrintfVargs(_format, argList); va_end(argList); } VertexDecl::VertexDecl() { // BK - struct need to have ctor to qualify as non-POD data. // Need this to catch programming errors when serializing struct. } VertexDecl& VertexDecl::begin(RendererType::Enum _renderer) { m_hash = _renderer; // use hash to store renderer type while building VertexDecl. m_stride = 0; memset(m_attributes, 0xff, sizeof(m_attributes) ); memset(m_offset, 0, sizeof(m_offset) ); return *this; } void VertexDecl::end() { bx::HashMurmur2A murmur; murmur.begin(); murmur.add(m_attributes, sizeof(m_attributes) ); murmur.add(m_offset, sizeof(m_offset) ); m_hash = murmur.end(); } VertexDecl& VertexDecl::add(Attrib::Enum _attrib, uint8_t _num, AttribType::Enum _type, bool _normalized, bool _asInt) { const uint8_t encodedNorm = (_normalized&1)<<6; const uint8_t encodedType = (_type&3)<<3; const uint8_t encodedNum = (_num-1)&3; const uint8_t encodeAsInt = (_asInt&(!!"\x1\x1\x0\x0"[_type]) )<<7; m_attributes[_attrib] = encodedNorm|encodedType|encodedNum|encodeAsInt; m_offset[_attrib] = m_stride; m_stride += (*s_attribTypeSize[m_hash])[_type][_num-1]; return *this; } VertexDecl& VertexDecl::skip(uint8_t _num) { m_stride += _num; return *this; } void VertexDecl::decode(Attrib::Enum _attrib, uint8_t& _num, AttribType::Enum& _type, bool& _normalized, bool& _asInt) const { uint8_t val = m_attributes[_attrib]; _num = (val&3)+1; _type = AttribType::Enum((val>>3)&3); _normalized = !!(val&(1<<6) ); _asInt = !!(val&(1<<7) ); } static const char* s_attrName[] = { "Attrib::Position", "Attrib::Normal", "Attrib::Tangent", "Attrib::Bitangent", "Attrib::Color0", "Attrib::Color1", "Attrib::Indices", "Attrib::Weights", "Attrib::TexCoord0", "Attrib::TexCoord1", "Attrib::TexCoord2", "Attrib::TexCoord3", "Attrib::TexCoord4", "Attrib::TexCoord5", "Attrib::TexCoord6", "Attrib::TexCoord7", }; BX_STATIC_ASSERT(BX_COUNTOF(s_attrName) == Attrib::Count); const char* getAttribName(Attrib::Enum _attr) { return s_attrName[_attr]; } void dump(const VertexDecl& _decl) { if (BX_ENABLED(BGFX_CONFIG_DEBUG) ) { dbgPrintf("vertexdecl %08x (%08x), stride %d\n" , _decl.m_hash , bx::hashMurmur2A(_decl.m_attributes) , _decl.m_stride ); for (uint32_t attr = 0; attr < Attrib::Count; ++attr) { if (0xff != _decl.m_attributes[attr]) { uint8_t num; AttribType::Enum type; bool normalized; bool asInt; _decl.decode(Attrib::Enum(attr), num, type, normalized, asInt); dbgPrintf("\tattr %d - %s, num %d, type %d, norm %d, asint %d, offset %d\n" , attr , getAttribName(Attrib::Enum(attr) ) , num , type , normalized , asInt , _decl.m_offset[attr] ); } } } } struct AttribToId { Attrib::Enum attr; uint16_t id; }; static AttribToId s_attribToId[] = { // NOTICE: // Attrib must be in order how it appears in Attrib::Enum! id is // unique and should not be changed if new Attribs are added. { Attrib::Position, 0x0001 }, { Attrib::Normal, 0x0002 }, { Attrib::Tangent, 0x0003 }, { Attrib::Bitangent, 0x0004 }, { Attrib::Color0, 0x0005 }, { Attrib::Color1, 0x0006 }, { Attrib::Indices, 0x000e }, { Attrib::Weight, 0x000f }, { Attrib::TexCoord0, 0x0010 }, { Attrib::TexCoord1, 0x0011 }, { Attrib::TexCoord2, 0x0012 }, { Attrib::TexCoord3, 0x0013 }, { Attrib::TexCoord4, 0x0014 }, { Attrib::TexCoord5, 0x0015 }, { Attrib::TexCoord6, 0x0016 }, { Attrib::TexCoord7, 0x0017 }, }; BX_STATIC_ASSERT(BX_COUNTOF(s_attribToId) == Attrib::Count); Attrib::Enum idToAttrib(uint16_t id) { for (uint32_t ii = 0; ii < BX_COUNTOF(s_attribToId); ++ii) { if (s_attribToId[ii].id == id) { return s_attribToId[ii].attr; } } return Attrib::Count; } uint16_t attribToId(Attrib::Enum _attr) { return s_attribToId[_attr].id; } struct AttribTypeToId { AttribType::Enum type; uint16_t id; }; static AttribTypeToId s_attribTypeToId[] = { // NOTICE: // AttribType must be in order how it appears in AttribType::Enum! // id is unique and should not be changed if new AttribTypes are // added. { AttribType::Uint8, 0x0001 }, { AttribType::Int16, 0x0002 }, { AttribType::Half, 0x0003 }, { AttribType::Float, 0x0004 }, }; BX_STATIC_ASSERT(BX_COUNTOF(s_attribTypeToId) == AttribType::Count); AttribType::Enum idToAttribType(uint16_t id) { for (uint32_t ii = 0; ii < BX_COUNTOF(s_attribTypeToId); ++ii) { if (s_attribTypeToId[ii].id == id) { return s_attribTypeToId[ii].type; } } return AttribType::Count; } uint16_t attribTypeToId(AttribType::Enum _attr) { return s_attribTypeToId[_attr].id; } int32_t write(bx::WriterI* _writer, const VertexDecl& _decl) { int32_t total = 0; uint8_t numAttrs = 0; for (uint32_t attr = 0; attr < Attrib::Count; ++attr) { numAttrs += 0xff == _decl.m_attributes[attr] ? 0 : 1; } total += bx::write(_writer, numAttrs); total += bx::write(_writer, _decl.m_stride); for (uint32_t attr = 0; attr < Attrib::Count; ++attr) { if (0xff != _decl.m_attributes[attr]) { uint8_t num; AttribType::Enum type; bool normalized; bool asInt; _decl.decode(Attrib::Enum(attr), num, type, normalized, asInt); total += bx::write(_writer, _decl.m_offset[attr]); total += bx::write(_writer, s_attribToId[attr].id); total += bx::write(_writer, num); total += bx::write(_writer, s_attribTypeToId[type].id); total += bx::write(_writer, normalized); total += bx::write(_writer, asInt); } } return total; } int32_t read(bx::ReaderI* _reader, VertexDecl& _decl) { int32_t total = 0; uint8_t numAttrs; total += bx::read(_reader, numAttrs); uint16_t stride; total += bx::read(_reader, stride); _decl.begin(); for (uint32_t ii = 0; ii < numAttrs; ++ii) { uint16_t offset; total += bx::read(_reader, offset); uint16_t attribId = 0; total += bx::read(_reader, attribId); uint8_t num; total += bx::read(_reader, num); uint16_t attribTypeId; total += bx::read(_reader, attribTypeId); bool normalized; total += bx::read(_reader, normalized); bool asInt; total += bx::read(_reader, asInt); Attrib::Enum attr = idToAttrib(attribId); AttribType::Enum type = idToAttribType(attribTypeId); if (Attrib::Count != attr && AttribType::Count != type) { _decl.add(attr, num, type, normalized, asInt); _decl.m_offset[attr] = offset; } } _decl.end(); _decl.m_stride = stride; return total; } void vertexPack(const float _input[4], bool _inputNormalized, Attrib::Enum _attr, const VertexDecl& _decl, void* _data, uint32_t _index) { if (!_decl.has(_attr) ) { return; } uint32_t stride = _decl.getStride(); uint8_t* data = (uint8_t*)_data + _index*stride + _decl.getOffset(_attr); uint8_t num; AttribType::Enum type; bool normalized; bool asInt; _decl.decode(_attr, num, type, normalized, asInt); switch (type) { default: case AttribType::Uint8: { uint8_t* packed = (uint8_t*)data; if (_inputNormalized) { if (asInt) { switch (num) { default: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f); case 3: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f); case 2: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f); case 1: *packed++ = uint8_t(*_input++ * 127.0f + 128.0f); } } else { switch (num) { default: *packed++ = uint8_t(*_input++ * 255.0f); case 3: *packed++ = uint8_t(*_input++ * 255.0f); case 2: *packed++ = uint8_t(*_input++ * 255.0f); case 1: *packed++ = uint8_t(*_input++ * 255.0f); } } } else { switch (num) { default: *packed++ = uint8_t(*_input++); case 3: *packed++ = uint8_t(*_input++); case 2: *packed++ = uint8_t(*_input++); case 1: *packed++ = uint8_t(*_input++); } } } break; case AttribType::Int16: { int16_t* packed = (int16_t*)data; if (_inputNormalized) { if (asInt) { switch (num) { default: *packed++ = int16_t(*_input++ * 32767.0f); case 3: *packed++ = int16_t(*_input++ * 32767.0f); case 2: *packed++ = int16_t(*_input++ * 32767.0f); case 1: *packed++ = int16_t(*_input++ * 32767.0f); } } else { switch (num) { default: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f); case 3: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f); case 2: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f); case 1: *packed++ = int16_t(*_input++ * 65535.0f - 32768.0f); } } } else { switch (num) { default: *packed++ = int16_t(*_input++); case 3: *packed++ = int16_t(*_input++); case 2: *packed++ = int16_t(*_input++); case 1: *packed++ = int16_t(*_input++); } } } break; case AttribType::Half: { uint16_t* packed = (uint16_t*)data; switch (num) { default: *packed++ = bx::halfFromFloat(*_input++); case 3: *packed++ = bx::halfFromFloat(*_input++); case 2: *packed++ = bx::halfFromFloat(*_input++); case 1: *packed++ = bx::halfFromFloat(*_input++); } } break; case AttribType::Float: memcpy(data, _input, num*sizeof(float) ); break; } } void vertexUnpack(float _output[4], Attrib::Enum _attr, const VertexDecl& _decl, const void* _data, uint32_t _index) { if (!_decl.has(_attr) ) { memset(_output, 0, 4*sizeof(float) ); return; } uint32_t stride = _decl.getStride(); uint8_t* data = (uint8_t*)_data + _index*stride + _decl.getOffset(_attr); uint8_t num; AttribType::Enum type; bool normalized; bool asInt; _decl.decode(_attr, num, type, normalized, asInt); switch (type) { default: case AttribType::Uint8: { uint8_t* packed = (uint8_t*)data; if (asInt) { switch (num) { default: *_output++ = (float(*packed++) - 128.0f)*1.0f/127.0f; case 3: *_output++ = (float(*packed++) - 128.0f)*1.0f/127.0f; case 2: *_output++ = (float(*packed++) - 128.0f)*1.0f/127.0f; case 1: *_output++ = (float(*packed++) - 128.0f)*1.0f/127.0f; } } else { switch (num) { default: *_output++ = float(*packed++)*1.0f/255.0f; case 3: *_output++ = float(*packed++)*1.0f/255.0f; case 2: *_output++ = float(*packed++)*1.0f/255.0f; case 1: *_output++ = float(*packed++)*1.0f/255.0f; } } } break; case AttribType::Int16: { int16_t* packed = (int16_t*)data; if (asInt) { switch (num) { default: *_output++ = float(*packed++)*1.0f/32767.0f; case 3: *_output++ = float(*packed++)*1.0f/32767.0f; case 2: *_output++ = float(*packed++)*1.0f/32767.0f; case 1: *_output++ = float(*packed++)*1.0f/32767.0f; } } else { switch (num) { default: *_output++ = (float(*packed++) + 32768.0f)*1.0f/65535.0f; case 3: *_output++ = (float(*packed++) + 32768.0f)*1.0f/65535.0f; case 2: *_output++ = (float(*packed++) + 32768.0f)*1.0f/65535.0f; case 1: *_output++ = (float(*packed++) + 32768.0f)*1.0f/65535.0f; } } } break; case AttribType::Half: { uint16_t* packed = (uint16_t*)data; switch (num) { default: *_output++ = bx::halfToFloat(*packed++); case 3: *_output++ = bx::halfToFloat(*packed++); case 2: *_output++ = bx::halfToFloat(*packed++); case 1: *_output++ = bx::halfToFloat(*packed++); } } break; case AttribType::Float: memcpy(_output, data, num*sizeof(float) ); _output += num; break; } switch (num) { case 1: *_output++ = 0.0f; case 2: *_output++ = 0.0f; case 3: *_output++ = 0.0f; default: break; } } void vertexConvert(const VertexDecl& _destDecl, void* _destData, const VertexDecl& _srcDecl, const void* _srcData, uint32_t _num) { if (_destDecl.m_hash == _srcDecl.m_hash) { memcpy(_destData, _srcData, _srcDecl.getSize(_num) ); return; } struct ConvertOp { enum Enum { Set, Copy, Convert, }; Attrib::Enum attr; Enum op; uint32_t src; uint32_t dest; uint32_t size; }; ConvertOp convertOp[Attrib::Count]; uint32_t numOps = 0; for (uint32_t ii = 0; ii < Attrib::Count; ++ii) { Attrib::Enum attr = (Attrib::Enum)ii; if (_destDecl.has(attr) ) { ConvertOp& cop = convertOp[numOps]; cop.attr = attr; cop.dest = _destDecl.getOffset(attr); uint8_t num; AttribType::Enum type; bool normalized; bool asInt; _destDecl.decode(attr, num, type, normalized, asInt); cop.size = (*s_attribTypeSize[0])[type][num-1]; if (_srcDecl.has(attr) ) { cop.src = _srcDecl.getOffset(attr); cop.op = _destDecl.m_attributes[attr] == _srcDecl.m_attributes[attr] ? ConvertOp::Copy : ConvertOp::Convert; } else { cop.op = ConvertOp::Set; } ++numOps; } } if (0 < numOps) { const uint8_t* src = (const uint8_t*)_srcData; uint32_t srcStride = _srcDecl.getStride(); uint8_t* dest = (uint8_t*)_destData; uint32_t destStride = _destDecl.getStride(); float unpacked[4]; for (uint32_t ii = 0; ii < _num; ++ii) { for (uint32_t jj = 0; jj < numOps; ++jj) { const ConvertOp& cop = convertOp[jj]; switch (cop.op) { case ConvertOp::Set: memset(dest + cop.dest, 0, cop.size); break; case ConvertOp::Copy: memcpy(dest + cop.dest, src + cop.src, cop.size); break; case ConvertOp::Convert: vertexUnpack(unpacked, cop.attr, _srcDecl, src); vertexPack(unpacked, true, cop.attr, _destDecl, dest); break; } } src += srcStride; dest += destStride; } } } inline float sqLength(const float _a[3], const float _b[3]) { const float xx = _a[0] - _b[0]; const float yy = _a[1] - _b[1]; const float zz = _a[2] - _b[2]; return xx*xx + yy*yy + zz*zz; } uint16_t weldVerticesRef(uint16_t* _output, const VertexDecl& _decl, const void* _data, uint16_t _num, float _epsilon) { // Brute force slow vertex welding... const float epsilonSq = _epsilon*_epsilon; uint32_t numVertices = 0; memset(_output, 0xff, _num*sizeof(uint16_t) ); for (uint32_t ii = 0; ii < _num; ++ii) { if (UINT16_MAX != _output[ii]) { continue; } _output[ii] = (uint16_t)ii; ++numVertices; float pos[4]; vertexUnpack(pos, Attrib::Position, _decl, _data, ii); for (uint32_t jj = 0; jj < _num; ++jj) { if (UINT16_MAX != _output[jj]) { continue; } float test[4]; vertexUnpack(test, Attrib::Position, _decl, _data, jj); if (sqLength(test, pos) < epsilonSq) { _output[jj] = (uint16_t)ii; } } } return (uint16_t)numVertices; } uint16_t weldVertices(uint16_t* _output, const VertexDecl& _decl, const void* _data, uint16_t _num, float _epsilon) { const uint32_t hashSize = bx::uint32_nextpow2(_num); const uint32_t hashMask = hashSize-1; const float epsilonSq = _epsilon*_epsilon; uint32_t numVertices = 0; const uint32_t size = sizeof(uint16_t)*(hashSize + _num); uint16_t* hashTable = (uint16_t*)alloca(size); memset(hashTable, 0xff, size); uint16_t* next = hashTable + hashSize; for (uint32_t ii = 0; ii < _num; ++ii) { float pos[4]; vertexUnpack(pos, Attrib::Position, _decl, _data, ii); uint32_t hashValue = bx::hashMurmur2A(pos, 3*sizeof(float) ) & hashMask; uint16_t offset = hashTable[hashValue]; for (; UINT16_MAX != offset; offset = next[offset]) { float test[4]; vertexUnpack(test, Attrib::Position, _decl, _data, _output[offset]); if (sqLength(test, pos) < epsilonSq) { _output[ii] = _output[offset]; break; } } if (UINT16_MAX == offset) { _output[ii] = (uint16_t)ii; next[ii] = hashTable[hashValue]; hashTable[hashValue] = (uint16_t)ii; numVertices++; } } return (uint16_t)numVertices; } } // namespace bgfx