// // Copyright (c) 2014-2015 The ANGLE Project Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // // copyvertex.inc.h: Implementation of vertex buffer copying and conversion functions namespace rx { template inline void CopyNativeVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { const size_t attribSize = sizeof(T) * inputComponentCount; if (attribSize == stride && inputComponentCount == outputComponentCount) { memcpy(output, input, count * attribSize); return; } if (inputComponentCount == outputComponentCount) { for (size_t i = 0; i < count; i++) { const T *offsetInput = reinterpret_cast(input + (i * stride)); T *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; memcpy(offsetOutput, offsetInput, attribSize); } return; } const T defaultAlphaValue = gl::bitCast(alphaDefaultValueBits); const size_t lastNonAlphaOutputComponent = std::min(outputComponentCount, 3); for (size_t i = 0; i < count; i++) { const T *offsetInput = reinterpret_cast(input + (i * stride)); T *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; memcpy(offsetOutput, offsetInput, attribSize); if (inputComponentCount < lastNonAlphaOutputComponent) { // Set the remaining G/B channels to 0. size_t numComponents = (lastNonAlphaOutputComponent - inputComponentCount); memset(&offsetOutput[inputComponentCount], 0, numComponents * sizeof(T)); } if (inputComponentCount < outputComponentCount && outputComponentCount == 4) { // Set the remaining alpha channel to the defaultAlphaValue. offsetOutput[3] = defaultAlphaValue; } } } template inline void Copy8SintTo16SintVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { const size_t lastNonAlphaOutputComponent = std::min(outputComponentCount, 3); for (size_t i = 0; i < count; i++) { const GLbyte *offsetInput = reinterpret_cast(input + i * stride); GLshort *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; for (size_t j = 0; j < inputComponentCount; j++) { offsetOutput[j] = static_cast(offsetInput[j]); } for (size_t j = inputComponentCount; j < lastNonAlphaOutputComponent; j++) { // Set remaining G/B channels to 0. offsetOutput[j] = 0; } if (inputComponentCount < outputComponentCount && outputComponentCount == 4) { // On integer formats, we must set the Alpha channel to 1 if it's unused. offsetOutput[3] = 1; } } } template inline void Copy8SnormTo16SnormVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { for (size_t i = 0; i < count; i++) { const GLbyte *offsetInput = reinterpret_cast(input + i * stride); GLshort *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; for (size_t j = 0; j < inputComponentCount; j++) { // The original GLbyte value ranges from -128 to +127 (INT8_MAX). // When converted to GLshort, the value must be scaled to between -32768 and +32767 // (INT16_MAX). if (offsetInput[j] > 0) { offsetOutput[j] = offsetInput[j] << 8 | offsetInput[j] << 1 | ((offsetInput[j] & 0x40) >> 6); } else { offsetOutput[j] = offsetInput[j] << 8; } } for (size_t j = inputComponentCount; j < std::min(outputComponentCount, 3); j++) { // Set remaining G/B channels to 0. offsetOutput[j] = 0; } if (inputComponentCount < outputComponentCount && outputComponentCount == 4) { // On normalized formats, we must set the Alpha channel to the max value if it's unused. offsetOutput[3] = INT16_MAX; } } } template inline void Copy32FixedTo32FVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { static const float divisor = 1.0f / (1 << 16); for (size_t i = 0; i < count; i++) { const uint8_t *offsetInput = input + i * stride; float *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; // GLfixed access must be 4-byte aligned on arm32, input and stride sometimes are not if (reinterpret_cast(offsetInput) % sizeof(GLfixed) == 0) { for (size_t j = 0; j < inputComponentCount; j++) { offsetOutput[j] = static_cast(reinterpret_cast(offsetInput)[j]) * divisor; } } else { for (size_t j = 0; j < inputComponentCount; j++) { GLfixed alignedInput; memcpy(&alignedInput, offsetInput + j * sizeof(GLfixed), sizeof(GLfixed)); offsetOutput[j] = static_cast(alignedInput) * divisor; } } // 4-component output formats would need special padding in the alpha channel. static_assert(!(inputComponentCount < 4 && outputComponentCount == 4), "An inputComponentCount less than 4 and an outputComponentCount equal to 4 " "is not supported."); for (size_t j = inputComponentCount; j < outputComponentCount; j++) { offsetOutput[j] = 0.0f; } } } template inline void CopyTo32FVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { typedef std::numeric_limits NL; for (size_t i = 0; i < count; i++) { const T *offsetInput = reinterpret_cast(input + (stride * i)); float *offsetOutput = reinterpret_cast(output) + i * outputComponentCount; for (size_t j = 0; j < inputComponentCount; j++) { if (normalized) { if (NL::is_signed) { const float divisor = 1.0f / (2 * static_cast(NL::max()) + 1); offsetOutput[j] = (2 * static_cast(offsetInput[j]) + 1) * divisor; } else { offsetOutput[j] = static_cast(offsetInput[j]) / NL::max(); } } else { offsetOutput[j] = static_cast(offsetInput[j]); } } // This would require special padding. static_assert(!(inputComponentCount < 4 && outputComponentCount == 4), "An inputComponentCount less than 4 and an outputComponentCount equal to 4 " "is not supported."); for (size_t j = inputComponentCount; j < outputComponentCount; j++) { offsetOutput[j] = 0.0f; } } } namespace priv { template static inline void CopyPackedRGB(uint32_t data, uint8_t *output) { const uint32_t rgbSignMask = 0x200; // 1 set at the 9 bit const uint32_t negativeMask = 0xFFFFFC00; // All bits from 10 to 31 set to 1 if (toFloat) { GLfloat *floatOutput = reinterpret_cast(output); if (isSigned) { GLfloat finalValue = 0; if (data & rgbSignMask) { int negativeNumber = data | negativeMask; finalValue = static_cast(negativeNumber); } else { finalValue = static_cast(data); } if (normalized) { const int32_t maxValue = 0x1FF; // 1 set in bits 0 through 8 const int32_t minValue = 0xFFFFFE01; // Inverse of maxValue // A 10-bit two's complement number has the possibility of being minValue - 1 but // OpenGL's normalization rules dictate that it should be clamped to minValue in // this case. if (finalValue < minValue) { finalValue = minValue; } const int32_t halfRange = (maxValue - minValue) >> 1; *floatOutput = ((finalValue - minValue) / halfRange) - 1.0f; } else { *floatOutput = finalValue; } } else { if (normalized) { const uint32_t maxValue = 0x3FF; // 1 set in bits 0 through 9 *floatOutput = static_cast(data) / static_cast(maxValue); } else { *floatOutput = static_cast(data); } } } else { if (isSigned) { GLshort *intOutput = reinterpret_cast(output); if (data & rgbSignMask) { *intOutput = static_cast(data | negativeMask); } else { *intOutput = static_cast(data); } } else { GLushort *uintOutput = reinterpret_cast(output); *uintOutput = static_cast(data); } } } template inline void CopyPackedAlpha(uint32_t data, uint8_t *output) { if (toFloat) { GLfloat *floatOutput = reinterpret_cast(output); if (isSigned) { if (normalized) { switch (data) { case 0x0: *floatOutput = 0.0f; break; case 0x1: *floatOutput = 1.0f; break; case 0x2: *floatOutput = -1.0f; break; case 0x3: *floatOutput = -1.0f; break; default: UNREACHABLE(); } } else { switch (data) { case 0x0: *floatOutput = 0.0f; break; case 0x1: *floatOutput = 1.0f; break; case 0x2: *floatOutput = -2.0f; break; case 0x3: *floatOutput = -1.0f; break; default: UNREACHABLE(); } } } else { if (normalized) { switch (data) { case 0x0: *floatOutput = 0.0f / 3.0f; break; case 0x1: *floatOutput = 1.0f / 3.0f; break; case 0x2: *floatOutput = 2.0f / 3.0f; break; case 0x3: *floatOutput = 3.0f / 3.0f; break; default: UNREACHABLE(); } } else { switch (data) { case 0x0: *floatOutput = 0.0f; break; case 0x1: *floatOutput = 1.0f; break; case 0x2: *floatOutput = 2.0f; break; case 0x3: *floatOutput = 3.0f; break; default: UNREACHABLE(); } } } } else { if (isSigned) { GLshort *intOutput = reinterpret_cast(output); switch (data) { case 0x0: *intOutput = 0; break; case 0x1: *intOutput = 1; break; case 0x2: *intOutput = -2; break; case 0x3: *intOutput = -1; break; default: UNREACHABLE(); } } else { GLushort *uintOutput = reinterpret_cast(output); switch (data) { case 0x0: *uintOutput = 0; break; case 0x1: *uintOutput = 1; break; case 0x2: *uintOutput = 2; break; case 0x3: *uintOutput = 3; break; default: UNREACHABLE(); } } } } } // namespace priv template inline void CopyXYZ10W2ToXYZW32FVertexData(const uint8_t *input, size_t stride, size_t count, uint8_t *output) { const size_t outputComponentSize = toFloat ? 4 : 2; const size_t componentCount = 4; const uint32_t rgbMask = 0x3FF; // 1 set in bits 0 through 9 const size_t redShift = 0; // red is bits 0 through 9 const size_t greenShift = 10; // green is bits 10 through 19 const size_t blueShift = 20; // blue is bits 20 through 29 const uint32_t alphaMask = 0x3; // 1 set in bits 0 and 1 const size_t alphaShift = 30; // Alpha is the 30 and 31 bits for (size_t i = 0; i < count; i++) { GLuint packedValue = *reinterpret_cast(input + (i * stride)); uint8_t *offsetOutput = output + (i * outputComponentSize * componentCount); priv::CopyPackedRGB( (packedValue >> redShift) & rgbMask, offsetOutput + (0 * outputComponentSize)); priv::CopyPackedRGB( (packedValue >> greenShift) & rgbMask, offsetOutput + (1 * outputComponentSize)); priv::CopyPackedRGB( (packedValue >> blueShift) & rgbMask, offsetOutput + (2 * outputComponentSize)); priv::CopyPackedAlpha( (packedValue >> alphaShift) & alphaMask, offsetOutput + (3 * outputComponentSize)); } } } // namespace rx