/*------------------------------------------------------------------------- * drawElements Quality Program Tester Core * ---------------------------------------- * * Copyright 2014 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * *//*! * \file * \brief Compressed Texture Utilities. *//*--------------------------------------------------------------------*/ #include "tcuCompressedTexture.hpp" #include "tcuTextureUtil.hpp" #include "tcuAstcUtil.hpp" #include "deStringUtil.hpp" #include "deFloat16.h" #include namespace tcu { int getBlockSize (CompressedTexFormat format) { if (isAstcFormat(format)) { return astc::BLOCK_SIZE_BYTES; } else if (isEtcFormat(format)) { switch (format) { case COMPRESSEDTEXFORMAT_ETC1_RGB8: return 8; case COMPRESSEDTEXFORMAT_EAC_R11: return 8; case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: return 8; case COMPRESSEDTEXFORMAT_EAC_RG11: return 16; case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: return 16; case COMPRESSEDTEXFORMAT_ETC2_RGB8: return 8; case COMPRESSEDTEXFORMAT_ETC2_SRGB8: return 8; case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: return 8; case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: return 8; case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: return 16; case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: return 16; default: DE_ASSERT(false); return -1; } } else if (isBcFormat(format)) { switch (format) { case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: return 8; case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: return 16; case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return 16; default: DE_ASSERT(false); return -1; } } else { DE_ASSERT(false); return -1; } } IVec3 getBlockPixelSize (CompressedTexFormat format) { if (isEtcFormat(format)) { return IVec3(4, 4, 1); } else if (isAstcFormat(format)) { switch (format) { case COMPRESSEDTEXFORMAT_ASTC_4x4_RGBA: return IVec3(4, 4, 1); case COMPRESSEDTEXFORMAT_ASTC_5x4_RGBA: return IVec3(5, 4, 1); case COMPRESSEDTEXFORMAT_ASTC_5x5_RGBA: return IVec3(5, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_6x5_RGBA: return IVec3(6, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_6x6_RGBA: return IVec3(6, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_8x5_RGBA: return IVec3(8, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_8x6_RGBA: return IVec3(8, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_8x8_RGBA: return IVec3(8, 8, 1); case COMPRESSEDTEXFORMAT_ASTC_10x5_RGBA: return IVec3(10, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_10x6_RGBA: return IVec3(10, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_10x8_RGBA: return IVec3(10, 8, 1); case COMPRESSEDTEXFORMAT_ASTC_10x10_RGBA: return IVec3(10, 10, 1); case COMPRESSEDTEXFORMAT_ASTC_12x10_RGBA: return IVec3(12, 10, 1); case COMPRESSEDTEXFORMAT_ASTC_12x12_RGBA: return IVec3(12, 12, 1); case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: return IVec3(4, 4, 1); case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: return IVec3(5, 4, 1); case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: return IVec3(5, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: return IVec3(6, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: return IVec3(6, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: return IVec3(8, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: return IVec3(8, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: return IVec3(8, 8, 1); case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: return IVec3(10, 5, 1); case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: return IVec3(10, 6, 1); case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: return IVec3(10, 8, 1); case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: return IVec3(10, 10, 1); case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: return IVec3(12, 10, 1); case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: return IVec3(12, 12, 1); default: DE_ASSERT(false); return IVec3(); } } else if (isBcFormat(format)) { return IVec3(4, 4, 1); } else { DE_ASSERT(false); return IVec3(-1); } } bool isEtcFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_ETC1_RGB8: case COMPRESSEDTEXFORMAT_EAC_R11: case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: case COMPRESSEDTEXFORMAT_EAC_RG11: case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: case COMPRESSEDTEXFORMAT_ETC2_RGB8: case COMPRESSEDTEXFORMAT_ETC2_SRGB8: case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: return true; default: return false; } } bool isBcFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return true; default: return false; } } bool isBcBitExactFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return true; default: return false; } } bool isBcSRGBFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return true; default: return false; } } bool isAstcFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_ASTC_4x4_RGBA: case COMPRESSEDTEXFORMAT_ASTC_5x4_RGBA: case COMPRESSEDTEXFORMAT_ASTC_5x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_6x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_6x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x8_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x8_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x10_RGBA: case COMPRESSEDTEXFORMAT_ASTC_12x10_RGBA: case COMPRESSEDTEXFORMAT_ASTC_12x12_RGBA: case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: return true; default: return false; } } bool isAstcSRGBFormat (CompressedTexFormat format) { switch (format) { case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: return true; default: return false; } } TextureFormat getUncompressedFormat (CompressedTexFormat format) { if (isEtcFormat(format)) { switch (format) { case COMPRESSEDTEXFORMAT_ETC1_RGB8: return TextureFormat(TextureFormat::RGB, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_EAC_R11: return TextureFormat(TextureFormat::R, TextureFormat::UNORM_INT16); case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: return TextureFormat(TextureFormat::R, TextureFormat::SNORM_INT16); case COMPRESSEDTEXFORMAT_EAC_RG11: return TextureFormat(TextureFormat::RG, TextureFormat::UNORM_INT16); case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: return TextureFormat(TextureFormat::RG, TextureFormat::SNORM_INT16); case COMPRESSEDTEXFORMAT_ETC2_RGB8: return TextureFormat(TextureFormat::RGB, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_ETC2_SRGB8: return TextureFormat(TextureFormat::sRGB, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); default: DE_ASSERT(false); return TextureFormat(); } } else if (isAstcFormat(format)) { if (isAstcSRGBFormat(format)) return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); else return TextureFormat(TextureFormat::RGBA, TextureFormat::HALF_FLOAT); } else if (isBcFormat(format)) { if (format == COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK) return TextureFormat(TextureFormat::R, TextureFormat::FLOAT); else if (format == COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK) return TextureFormat(TextureFormat::RG, TextureFormat::FLOAT); else if (format == COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK || format == COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK) return TextureFormat(TextureFormat::RGB, TextureFormat::HALF_FLOAT); else if (isBcSRGBFormat(format)) return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); else return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); } else { DE_ASSERT(false); return TextureFormat(); } } CompressedTexFormat getAstcFormatByBlockSize (const IVec3& size, bool isSRGB) { if (size.z() > 1) throw InternalError("3D ASTC textures not currently supported"); for (int fmtI = 0; fmtI < COMPRESSEDTEXFORMAT_LAST; fmtI++) { const CompressedTexFormat fmt = (CompressedTexFormat)fmtI; if (isAstcFormat(fmt) && getBlockPixelSize(fmt) == size && isAstcSRGBFormat(fmt) == isSRGB) return fmt; } throw InternalError("Invalid ASTC block size " + de::toString(size.x()) + "x" + de::toString(size.y()) + "x" + de::toString(size.z())); } namespace { inline deUint8 extend4To8 (deUint8 src) { DE_ASSERT((src & ~((1<<4)-1)) == 0); return (deUint8)((src << 4) | src); } inline deUint8 extend5To8 (deUint8 src) { DE_ASSERT((src & ~((1<<5)-1)) == 0); return (deUint8)((src << 3) | (src >> 2)); } inline deUint8 extend6To8 (deUint8 src) { DE_ASSERT((src & ~((1<<6)-1)) == 0); return (deUint8)((src << 2) | (src >> 4)); } // \todo [2013-08-06 nuutti] ETC and ASTC decompression codes are rather unrelated, and are already in their own "private" namespaces - should this be split to multiple files? namespace EtcDecompressInternal { enum { ETC2_BLOCK_WIDTH = 4, ETC2_BLOCK_HEIGHT = 4, ETC2_UNCOMPRESSED_PIXEL_SIZE_A8 = 1, ETC2_UNCOMPRESSED_PIXEL_SIZE_R11 = 2, ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11 = 4, ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8 = 3, ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 = 4, ETC2_UNCOMPRESSED_BLOCK_SIZE_A8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8, ETC2_UNCOMPRESSED_BLOCK_SIZE_R11 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11, ETC2_UNCOMPRESSED_BLOCK_SIZE_RG11 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11, ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8, ETC2_UNCOMPRESSED_BLOCK_SIZE_RGBA8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 }; inline deUint64 get64BitBlock (const deUint8* src, int blockNdx) { // Stored in big-endian form. deUint64 block = 0; for (int i = 0; i < 8; i++) block = (block << 8ull) | (deUint64)(src[blockNdx*8+i]); return block; } // Return the first 64 bits of a 128 bit block. inline deUint64 get128BitBlockStart (const deUint8* src, int blockNdx) { return get64BitBlock(src, 2*blockNdx); } // Return the last 64 bits of a 128 bit block. inline deUint64 get128BitBlockEnd (const deUint8* src, int blockNdx) { return get64BitBlock(src, 2*blockNdx + 1); } inline deUint32 getBit (deUint64 src, int bit) { return (src >> bit) & 1; } inline deUint32 getBits (deUint64 src, int low, int high) { const int numBits = (high-low) + 1; DE_ASSERT(de::inRange(numBits, 1, 32)); if (numBits < 32) return (deUint32)((src >> low) & ((1u<> low) & 0xFFFFFFFFu); } inline deUint8 extend7To8 (deUint8 src) { DE_ASSERT((src & ~((1<<7)-1)) == 0); return (deUint8)((src << 1) | (src >> 6)); } inline deInt8 extendSigned3To8 (deUint8 src) { const bool isNeg = (src & (1<<2)) != 0; return (deInt8)((isNeg ? ~((1<<3)-1) : 0) | src); } inline deUint8 extend5Delta3To8 (deUint8 base5, deUint8 delta3) { const deUint8 t = (deUint8)((deInt8)base5 + extendSigned3To8(delta3)); return extend5To8(t); } inline deUint16 extend11To16 (deUint16 src) { DE_ASSERT((src & ~((1<<11)-1)) == 0); return (deUint16)((src << 5) | (src >> 6)); } inline deInt16 extend11To16WithSign (deInt16 src) { if (src < 0) return (deInt16)(-(deInt16)extend11To16((deUint16)(-src))); else return (deInt16)extend11To16(src); } void decompressETC1Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8], deUint64 src) { const int diffBit = (int)getBit(src, 33); const int flipBit = (int)getBit(src, 32); const deUint32 table[2] = { getBits(src, 37, 39), getBits(src, 34, 36) }; deUint8 baseR[2]; deUint8 baseG[2]; deUint8 baseB[2]; if (diffBit == 0) { // Individual mode. baseR[0] = extend4To8((deUint8)getBits(src, 60, 63)); baseR[1] = extend4To8((deUint8)getBits(src, 56, 59)); baseG[0] = extend4To8((deUint8)getBits(src, 52, 55)); baseG[1] = extend4To8((deUint8)getBits(src, 48, 51)); baseB[0] = extend4To8((deUint8)getBits(src, 44, 47)); baseB[1] = extend4To8((deUint8)getBits(src, 40, 43)); } else { // Differential mode (diffBit == 1). deUint8 bR = (deUint8)getBits(src, 59, 63); // 5b deUint8 dR = (deUint8)getBits(src, 56, 58); // 3b deUint8 bG = (deUint8)getBits(src, 51, 55); deUint8 dG = (deUint8)getBits(src, 48, 50); deUint8 bB = (deUint8)getBits(src, 43, 47); deUint8 dB = (deUint8)getBits(src, 40, 42); baseR[0] = extend5To8(bR); baseG[0] = extend5To8(bG); baseB[0] = extend5To8(bB); baseR[1] = extend5Delta3To8(bR, dR); baseG[1] = extend5Delta3To8(bG, dG); baseB[1] = extend5Delta3To8(bB, dB); } static const int modifierTable[8][4] = { // 00 01 10 11 { 2, 8, -2, -8 }, { 5, 17, -5, -17 }, { 9, 29, -9, -29 }, { 13, 42, -13, -42 }, { 18, 60, -18, -60 }, { 24, 80, -24, -80 }, { 33, 106, -33, -106 }, { 47, 183, -47, -183 } }; // Write final pixels. for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) { const int x = pixelNdx / ETC2_BLOCK_HEIGHT; const int y = pixelNdx % ETC2_BLOCK_HEIGHT; const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; const int subBlock = ((flipBit ? y : x) >= 2) ? 1 : 0; const deUint32 tableNdx = table[subBlock]; const deUint32 modifierNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); const int modifier = modifierTable[tableNdx][modifierNdx]; dst[dstOffset+0] = (deUint8)deClamp32((int)baseR[subBlock] + modifier, 0, 255); dst[dstOffset+1] = (deUint8)deClamp32((int)baseG[subBlock] + modifier, 0, 255); dst[dstOffset+2] = (deUint8)deClamp32((int)baseB[subBlock] + modifier, 0, 255); } } // if alphaMode is true, do PUNCHTHROUGH and store alpha to alphaDst; otherwise do ordinary ETC2 RGB8. void decompressETC2Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8], deUint64 src, deUint8 alphaDst[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8], bool alphaMode) { enum Etc2Mode { MODE_INDIVIDUAL = 0, MODE_DIFFERENTIAL, MODE_T, MODE_H, MODE_PLANAR, MODE_LAST }; const int diffOpaqueBit = (int)getBit(src, 33); const deInt8 selBR = (deInt8)getBits(src, 59, 63); // 5 bits. const deInt8 selBG = (deInt8)getBits(src, 51, 55); const deInt8 selBB = (deInt8)getBits(src, 43, 47); const deInt8 selDR = extendSigned3To8((deUint8)getBits(src, 56, 58)); // 3 bits. const deInt8 selDG = extendSigned3To8((deUint8)getBits(src, 48, 50)); const deInt8 selDB = extendSigned3To8((deUint8)getBits(src, 40, 42)); Etc2Mode mode; if (!alphaMode && diffOpaqueBit == 0) mode = MODE_INDIVIDUAL; else if (!de::inRange(selBR + selDR, 0, 31)) mode = MODE_T; else if (!de::inRange(selBG + selDG, 0, 31)) mode = MODE_H; else if (!de::inRange(selBB + selDB, 0, 31)) mode = MODE_PLANAR; else mode = MODE_DIFFERENTIAL; if (mode == MODE_INDIVIDUAL || mode == MODE_DIFFERENTIAL) { // Individual and differential modes have some steps in common, handle them here. static const int modifierTable[8][4] = { // 00 01 10 11 { 2, 8, -2, -8 }, { 5, 17, -5, -17 }, { 9, 29, -9, -29 }, { 13, 42, -13, -42 }, { 18, 60, -18, -60 }, { 24, 80, -24, -80 }, { 33, 106, -33, -106 }, { 47, 183, -47, -183 } }; const int flipBit = (int)getBit(src, 32); const deUint32 table[2] = { getBits(src, 37, 39), getBits(src, 34, 36) }; deUint8 baseR[2]; deUint8 baseG[2]; deUint8 baseB[2]; if (mode == MODE_INDIVIDUAL) { // Individual mode, initial values. baseR[0] = extend4To8((deUint8)getBits(src, 60, 63)); baseR[1] = extend4To8((deUint8)getBits(src, 56, 59)); baseG[0] = extend4To8((deUint8)getBits(src, 52, 55)); baseG[1] = extend4To8((deUint8)getBits(src, 48, 51)); baseB[0] = extend4To8((deUint8)getBits(src, 44, 47)); baseB[1] = extend4To8((deUint8)getBits(src, 40, 43)); } else { // Differential mode, initial values. baseR[0] = extend5To8(selBR); baseG[0] = extend5To8(selBG); baseB[0] = extend5To8(selBB); baseR[1] = extend5To8((deUint8)(selBR + selDR)); baseG[1] = extend5To8((deUint8)(selBG + selDG)); baseB[1] = extend5To8((deUint8)(selBB + selDB)); } // Write final pixels for individual or differential mode. for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) { const int x = pixelNdx / ETC2_BLOCK_HEIGHT; const int y = pixelNdx % ETC2_BLOCK_HEIGHT; const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; const int subBlock = ((flipBit ? y : x) >= 2) ? 1 : 0; const deUint32 tableNdx = table[subBlock]; const deUint32 modifierNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. // If doing PUNCHTHROUGH version (alphaMode), opaque bit may affect colors. if (alphaMode && diffOpaqueBit == 0 && modifierNdx == 2) { dst[dstOffset+0] = 0; dst[dstOffset+1] = 0; dst[dstOffset+2] = 0; alphaDst[alphaDstOffset] = 0; } else { int modifier; // PUNCHTHROUGH version and opaque bit may also affect modifiers. if (alphaMode && diffOpaqueBit == 0 && (modifierNdx == 0 || modifierNdx == 2)) modifier = 0; else modifier = modifierTable[tableNdx][modifierNdx]; dst[dstOffset+0] = (deUint8)deClamp32((int)baseR[subBlock] + modifier, 0, 255); dst[dstOffset+1] = (deUint8)deClamp32((int)baseG[subBlock] + modifier, 0, 255); dst[dstOffset+2] = (deUint8)deClamp32((int)baseB[subBlock] + modifier, 0, 255); if (alphaMode) alphaDst[alphaDstOffset] = 255; } } } else if (mode == MODE_T || mode == MODE_H) { // T and H modes have some steps in common, handle them here. static const int distTable[8] = { 3, 6, 11, 16, 23, 32, 41, 64 }; deUint8 paintR[4]; deUint8 paintG[4]; deUint8 paintB[4]; if (mode == MODE_T) { // T mode, calculate paint values. const deUint8 R1a = (deUint8)getBits(src, 59, 60); const deUint8 R1b = (deUint8)getBits(src, 56, 57); const deUint8 G1 = (deUint8)getBits(src, 52, 55); const deUint8 B1 = (deUint8)getBits(src, 48, 51); const deUint8 R2 = (deUint8)getBits(src, 44, 47); const deUint8 G2 = (deUint8)getBits(src, 40, 43); const deUint8 B2 = (deUint8)getBits(src, 36, 39); const deUint32 distNdx = (getBits(src, 34, 35) << 1) | getBit(src, 32); const int dist = distTable[distNdx]; paintR[0] = extend4To8((deUint8)((R1a << 2) | R1b)); paintG[0] = extend4To8(G1); paintB[0] = extend4To8(B1); paintR[2] = extend4To8(R2); paintG[2] = extend4To8(G2); paintB[2] = extend4To8(B2); paintR[1] = (deUint8)deClamp32((int)paintR[2] + dist, 0, 255); paintG[1] = (deUint8)deClamp32((int)paintG[2] + dist, 0, 255); paintB[1] = (deUint8)deClamp32((int)paintB[2] + dist, 0, 255); paintR[3] = (deUint8)deClamp32((int)paintR[2] - dist, 0, 255); paintG[3] = (deUint8)deClamp32((int)paintG[2] - dist, 0, 255); paintB[3] = (deUint8)deClamp32((int)paintB[2] - dist, 0, 255); } else { // H mode, calculate paint values. const deUint8 R1 = (deUint8)getBits(src, 59, 62); const deUint8 G1a = (deUint8)getBits(src, 56, 58); const deUint8 G1b = (deUint8)getBit(src, 52); const deUint8 B1a = (deUint8)getBit(src, 51); const deUint8 B1b = (deUint8)getBits(src, 47, 49); const deUint8 R2 = (deUint8)getBits(src, 43, 46); const deUint8 G2 = (deUint8)getBits(src, 39, 42); const deUint8 B2 = (deUint8)getBits(src, 35, 38); deUint8 baseR[2]; deUint8 baseG[2]; deUint8 baseB[2]; deUint32 baseValue[2]; deUint32 distNdx; int dist; baseR[0] = extend4To8(R1); baseG[0] = extend4To8((deUint8)((G1a << 1) | G1b)); baseB[0] = extend4To8((deUint8)((B1a << 3) | B1b)); baseR[1] = extend4To8(R2); baseG[1] = extend4To8(G2); baseB[1] = extend4To8(B2); baseValue[0] = (((deUint32)baseR[0]) << 16) | (((deUint32)baseG[0]) << 8) | baseB[0]; baseValue[1] = (((deUint32)baseR[1]) << 16) | (((deUint32)baseG[1]) << 8) | baseB[1]; distNdx = (getBit(src, 34) << 2) | (getBit(src, 32) << 1) | (deUint32)(baseValue[0] >= baseValue[1]); dist = distTable[distNdx]; paintR[0] = (deUint8)deClamp32((int)baseR[0] + dist, 0, 255); paintG[0] = (deUint8)deClamp32((int)baseG[0] + dist, 0, 255); paintB[0] = (deUint8)deClamp32((int)baseB[0] + dist, 0, 255); paintR[1] = (deUint8)deClamp32((int)baseR[0] - dist, 0, 255); paintG[1] = (deUint8)deClamp32((int)baseG[0] - dist, 0, 255); paintB[1] = (deUint8)deClamp32((int)baseB[0] - dist, 0, 255); paintR[2] = (deUint8)deClamp32((int)baseR[1] + dist, 0, 255); paintG[2] = (deUint8)deClamp32((int)baseG[1] + dist, 0, 255); paintB[2] = (deUint8)deClamp32((int)baseB[1] + dist, 0, 255); paintR[3] = (deUint8)deClamp32((int)baseR[1] - dist, 0, 255); paintG[3] = (deUint8)deClamp32((int)baseG[1] - dist, 0, 255); paintB[3] = (deUint8)deClamp32((int)baseB[1] - dist, 0, 255); } // Write final pixels for T or H mode. for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) { const int x = pixelNdx / ETC2_BLOCK_HEIGHT; const int y = pixelNdx % ETC2_BLOCK_HEIGHT; const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; const deUint32 paintNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. if (alphaMode && diffOpaqueBit == 0 && paintNdx == 2) { dst[dstOffset+0] = 0; dst[dstOffset+1] = 0; dst[dstOffset+2] = 0; alphaDst[alphaDstOffset] = 0; } else { dst[dstOffset+0] = (deUint8)deClamp32((int)paintR[paintNdx], 0, 255); dst[dstOffset+1] = (deUint8)deClamp32((int)paintG[paintNdx], 0, 255); dst[dstOffset+2] = (deUint8)deClamp32((int)paintB[paintNdx], 0, 255); if (alphaMode) alphaDst[alphaDstOffset] = 255; } } } else { // Planar mode. const deUint8 GO1 = (deUint8)getBit(src, 56); const deUint8 GO2 = (deUint8)getBits(src, 49, 54); const deUint8 BO1 = (deUint8)getBit(src, 48); const deUint8 BO2 = (deUint8)getBits(src, 43, 44); const deUint8 BO3 = (deUint8)getBits(src, 39, 41); const deUint8 RH1 = (deUint8)getBits(src, 34, 38); const deUint8 RH2 = (deUint8)getBit(src, 32); const deUint8 RO = extend6To8((deUint8)getBits(src, 57, 62)); const deUint8 GO = extend7To8((deUint8)((GO1 << 6) | GO2)); const deUint8 BO = extend6To8((deUint8)((BO1 << 5) | (BO2 << 3) | BO3)); const deUint8 RH = extend6To8((deUint8)((RH1 << 1) | RH2)); const deUint8 GH = extend7To8((deUint8)getBits(src, 25, 31)); const deUint8 BH = extend6To8((deUint8)getBits(src, 19, 24)); const deUint8 RV = extend6To8((deUint8)getBits(src, 13, 18)); const deUint8 GV = extend7To8((deUint8)getBits(src, 6, 12)); const deUint8 BV = extend6To8((deUint8)getBits(src, 0, 5)); // Write final pixels for planar mode. for (int y = 0; y < 4; y++) { for (int x = 0; x < 4; x++) { const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; const int unclampedR = (x * ((int)RH-(int)RO) + y * ((int)RV-(int)RO) + 4*(int)RO + 2) >> 2; const int unclampedG = (x * ((int)GH-(int)GO) + y * ((int)GV-(int)GO) + 4*(int)GO + 2) >> 2; const int unclampedB = (x * ((int)BH-(int)BO) + y * ((int)BV-(int)BO) + 4*(int)BO + 2) >> 2; const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. dst[dstOffset+0] = (deUint8)deClamp32(unclampedR, 0, 255); dst[dstOffset+1] = (deUint8)deClamp32(unclampedG, 0, 255); dst[dstOffset+2] = (deUint8)deClamp32(unclampedB, 0, 255); if (alphaMode) alphaDst[alphaDstOffset] = 255; } } } } void decompressEAC8Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8], deUint64 src) { static const int modifierTable[16][8] = { {-3, -6, -9, -15, 2, 5, 8, 14}, {-3, -7, -10, -13, 2, 6, 9, 12}, {-2, -5, -8, -13, 1, 4, 7, 12}, {-2, -4, -6, -13, 1, 3, 5, 12}, {-3, -6, -8, -12, 2, 5, 7, 11}, {-3, -7, -9, -11, 2, 6, 8, 10}, {-4, -7, -8, -11, 3, 6, 7, 10}, {-3, -5, -8, -11, 2, 4, 7, 10}, {-2, -6, -8, -10, 1, 5, 7, 9}, {-2, -5, -8, -10, 1, 4, 7, 9}, {-2, -4, -8, -10, 1, 3, 7, 9}, {-2, -5, -7, -10, 1, 4, 6, 9}, {-3, -4, -7, -10, 2, 3, 6, 9}, {-1, -2, -3, -10, 0, 1, 2, 9}, {-4, -6, -8, -9, 3, 5, 7, 8}, {-3, -5, -7, -9, 2, 4, 6, 8} }; const deUint8 baseCodeword = (deUint8)getBits(src, 56, 63); const deUint8 multiplier = (deUint8)getBits(src, 52, 55); const deUint32 tableNdx = getBits(src, 48, 51); for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) { const int x = pixelNdx / ETC2_BLOCK_HEIGHT; const int y = pixelNdx % ETC2_BLOCK_HEIGHT; const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; const int pixelBitNdx = 45 - 3*pixelNdx; const deUint32 modifierNdx = (getBit(src, pixelBitNdx + 2) << 2) | (getBit(src, pixelBitNdx + 1) << 1) | getBit(src, pixelBitNdx); const int modifier = modifierTable[tableNdx][modifierNdx]; dst[dstOffset] = (deUint8)deClamp32((int)baseCodeword + (int)multiplier*modifier, 0, 255); } } void decompressEAC11Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11], deUint64 src, bool signedMode) { static const int modifierTable[16][8] = { {-3, -6, -9, -15, 2, 5, 8, 14}, {-3, -7, -10, -13, 2, 6, 9, 12}, {-2, -5, -8, -13, 1, 4, 7, 12}, {-2, -4, -6, -13, 1, 3, 5, 12}, {-3, -6, -8, -12, 2, 5, 7, 11}, {-3, -7, -9, -11, 2, 6, 8, 10}, {-4, -7, -8, -11, 3, 6, 7, 10}, {-3, -5, -8, -11, 2, 4, 7, 10}, {-2, -6, -8, -10, 1, 5, 7, 9}, {-2, -5, -8, -10, 1, 4, 7, 9}, {-2, -4, -8, -10, 1, 3, 7, 9}, {-2, -5, -7, -10, 1, 4, 6, 9}, {-3, -4, -7, -10, 2, 3, 6, 9}, {-1, -2, -3, -10, 0, 1, 2, 9}, {-4, -6, -8, -9, 3, 5, 7, 8}, {-3, -5, -7, -9, 2, 4, 6, 8} }; const deInt32 multiplier = (deInt32)getBits(src, 52, 55); const deInt32 tableNdx = (deInt32)getBits(src, 48, 51); deInt32 baseCodeword = (deInt32)getBits(src, 56, 63); if (signedMode) { if (baseCodeword > 127) baseCodeword -= 256; if (baseCodeword == -128) baseCodeword = -127; } for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) { const int x = pixelNdx / ETC2_BLOCK_HEIGHT; const int y = pixelNdx % ETC2_BLOCK_HEIGHT; const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11; const int pixelBitNdx = 45 - 3*pixelNdx; const deUint32 modifierNdx = (getBit(src, pixelBitNdx + 2) << 2) | (getBit(src, pixelBitNdx + 1) << 1) | getBit(src, pixelBitNdx); const int modifier = modifierTable[tableNdx][modifierNdx]; if (signedMode) { deInt16 value; if (multiplier != 0) value = (deInt16)deClamp32(baseCodeword*8 + multiplier*modifier*8, -1023, 1023); else value = (deInt16)deClamp32(baseCodeword*8 + modifier, -1023, 1023); *((deInt16*)(dst + dstOffset)) = value; } else { deUint16 value; if (multiplier != 0) value = (deUint16)deClamp32(baseCodeword*8 + 4 + multiplier*modifier*8, 0, 2047); else value= (deUint16)deClamp32(baseCodeword*8 + 4 + modifier, 0, 2047); *((deUint16*)(dst + dstOffset)) = value; } } } } // EtcDecompressInternal void decompressETC1 (const PixelBufferAccess& dst, const deUint8* src) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint64 compressedBlock = get64BitBlock(src, 0); decompressETC1Block(dstPtr, compressedBlock); } void decompressETC2 (const PixelBufferAccess& dst, const deUint8* src) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint64 compressedBlock = get64BitBlock(src, 0); decompressETC2Block(dstPtr, compressedBlock, NULL, false); } void decompressETC2_EAC_RGBA8 (const PixelBufferAccess& dst, const deUint8* src) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const int dstRowPitch = dst.getRowPitch(); const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8; const deUint64 compressedBlockAlpha = get128BitBlockStart(src, 0); const deUint64 compressedBlockRGB = get128BitBlockEnd(src, 0); deUint8 uncompressedBlockAlpha[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8]; deUint8 uncompressedBlockRGB[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8]; // Decompress. decompressETC2Block(uncompressedBlockRGB, compressedBlockRGB, NULL, false); decompressEAC8Block(uncompressedBlockAlpha, compressedBlockAlpha); // Write to dst. for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) { for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) { const deUint8* const srcPixelRGB = &uncompressedBlockRGB[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8]; const deUint8* const srcPixelAlpha = &uncompressedBlockAlpha[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8]; deUint8* const dstPixel = dstPtr + y*dstRowPitch + x*dstPixelSize; DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 == 4); dstPixel[0] = srcPixelRGB[0]; dstPixel[1] = srcPixelRGB[1]; dstPixel[2] = srcPixelRGB[2]; dstPixel[3] = srcPixelAlpha[0]; } } } void decompressETC2_RGB8_PUNCHTHROUGH_ALPHA1 (const PixelBufferAccess& dst, const deUint8* src) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const int dstRowPitch = dst.getRowPitch(); const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8; const deUint64 compressedBlockRGBA = get64BitBlock(src, 0); deUint8 uncompressedBlockRGB[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8]; deUint8 uncompressedBlockAlpha[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8]; // Decompress. decompressETC2Block(uncompressedBlockRGB, compressedBlockRGBA, uncompressedBlockAlpha, DE_TRUE); // Write to dst. for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) { for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) { const deUint8* const srcPixel = &uncompressedBlockRGB[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8]; const deUint8* const srcPixelAlpha = &uncompressedBlockAlpha[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8]; deUint8* const dstPixel = dstPtr + y*dstRowPitch + x*dstPixelSize; DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 == 4); dstPixel[0] = srcPixel[0]; dstPixel[1] = srcPixel[1]; dstPixel[2] = srcPixel[2]; dstPixel[3] = srcPixelAlpha[0]; } } } void decompressEAC_R11 (const PixelBufferAccess& dst, const deUint8* src, bool signedMode) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const int dstRowPitch = dst.getRowPitch(); const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_R11; const deUint64 compressedBlock = get64BitBlock(src, 0); deUint8 uncompressedBlock[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; // Decompress. decompressEAC11Block(uncompressedBlock, compressedBlock, signedMode); // Write to dst. for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) { for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) { DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_R11 == 2); if (signedMode) { const deInt16* const srcPixel = (deInt16*)&uncompressedBlock[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; deInt16* const dstPixel = (deInt16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); dstPixel[0] = extend11To16WithSign(srcPixel[0]); } else { const deUint16* const srcPixel = (deUint16*)&uncompressedBlock[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; deUint16* const dstPixel = (deUint16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); dstPixel[0] = extend11To16(srcPixel[0]); } } } } void decompressEAC_RG11 (const PixelBufferAccess& dst, const deUint8* src, bool signedMode) { using namespace EtcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const int dstRowPitch = dst.getRowPitch(); const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11; const deUint64 compressedBlockR = get128BitBlockStart(src, 0); const deUint64 compressedBlockG = get128BitBlockEnd(src, 0); deUint8 uncompressedBlockR[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; deUint8 uncompressedBlockG[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; // Decompress. decompressEAC11Block(uncompressedBlockR, compressedBlockR, signedMode); decompressEAC11Block(uncompressedBlockG, compressedBlockG, signedMode); // Write to dst. for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) { for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) { DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11 == 4); if (signedMode) { const deInt16* const srcPixelR = (deInt16*)&uncompressedBlockR[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; const deInt16* const srcPixelG = (deInt16*)&uncompressedBlockG[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; deInt16* const dstPixel = (deInt16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); dstPixel[0] = extend11To16WithSign(srcPixelR[0]); dstPixel[1] = extend11To16WithSign(srcPixelG[0]); } else { const deUint16* const srcPixelR = (deUint16*)&uncompressedBlockR[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; const deUint16* const srcPixelG = (deUint16*)&uncompressedBlockG[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; deUint16* const dstPixel = (deUint16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); dstPixel[0] = extend11To16(srcPixelR[0]); dstPixel[1] = extend11To16(srcPixelG[0]); } } } } namespace BcDecompressInternal { enum { BC_BLOCK_WIDTH = 4, BC_BLOCK_HEIGHT = 4 }; static const deUint8 epBits[14] = { 10, 7, 11, 11, 11, 9, 8, 8, 8, 6, 10, 11, 12, 16 }; static const deUint8 partitions2[64][16] = { { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 }, { 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1 }, { 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1 }, { 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1 }, { 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1 }, { 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1 }, { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1 }, { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1 }, { 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 }, { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0 }, { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0 }, { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 }, { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0 }, { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 }, { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1 }, { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0 }, { 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 }, { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0 }, { 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0 }, { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0 }, { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 }, { 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0 }, { 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0 }, { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1 }, { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1 }, { 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0 }, { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0 }, { 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0 }, { 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0 }, { 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1 }, { 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1 }, { 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0 }, { 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0 }, { 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0 }, { 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0 }, { 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0 }, { 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1 }, { 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1 }, { 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0 }, { 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0 }, { 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0 }, { 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0 }, { 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0 }, { 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1 }, { 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1 }, { 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0 }, { 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0 }, { 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1 }, { 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1 }, { 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1 }, { 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1 }, { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 }, { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 }, { 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0 }, { 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1 } }; static const deUint8 partitions3[64][16] = { { 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 1, 2, 2, 2, 2 }, { 0, 0, 0, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 2, 1 }, { 0, 0, 0, 0, 2, 0, 0, 1, 2, 2, 1, 1, 2, 2, 1, 1 }, { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 1, 0, 1, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2 }, { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 2, 2 }, { 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1 }, { 0, 0, 1, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1 }, { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2 }, { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2 }, { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2 }, { 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2 }, { 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2 }, { 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2 }, { 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2, 1, 2, 2, 2 }, { 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0, 2, 2, 2, 0 }, { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2 }, { 0, 1, 1, 1, 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0 }, { 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2 }, { 0, 0, 2, 2, 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1 }, { 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2, 0, 2, 2, 2 }, { 0, 0, 0, 1, 0, 0, 0, 1, 2, 2, 2, 1, 2, 2, 2, 1 }, { 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2 }, { 0, 0, 0, 0, 1, 1, 0, 0, 2, 2, 1, 0, 2, 2, 1, 0 }, { 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1, 0, 0, 0, 0 }, { 0, 0, 1, 2, 0, 0, 1, 2, 1, 1, 2, 2, 2, 2, 2, 2 }, { 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1, 0, 1, 1, 0 }, { 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1 }, { 0, 0, 2, 2, 1, 1, 0, 2, 1, 1, 0, 2, 0, 0, 2, 2 }, { 0, 1, 1, 0, 0, 1, 1, 0, 2, 0, 0, 2, 2, 2, 2, 2 }, { 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1 }, { 0, 0, 0, 0, 2, 0, 0, 0, 2, 2, 1, 1, 2, 2, 2, 1 }, { 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 2, 2, 2 }, { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 2, 0, 0, 1, 1 }, { 0, 0, 1, 1, 0, 0, 1, 2, 0, 0, 2, 2, 0, 2, 2, 2 }, { 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0 }, { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0 }, { 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0 }, { 0, 1, 2, 0, 2, 0, 1, 2, 1, 2, 0, 1, 0, 1, 2, 0 }, { 0, 0, 1, 1, 2, 2, 0, 0, 1, 1, 2, 2, 0, 0, 1, 1 }, { 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0, 1, 1 }, { 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2 }, { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1 }, { 0, 0, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2, 1, 1, 2, 2 }, { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 1, 1 }, { 0, 2, 2, 0, 1, 2, 2, 1, 0, 2, 2, 0, 1, 2, 2, 1 }, { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 0, 1, 0, 1 }, { 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1 }, { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2 }, { 0, 2, 2, 2, 0, 1, 1, 1, 0, 2, 2, 2, 0, 1, 1, 1 }, { 0, 0, 0, 2, 1, 1, 1, 2, 0, 0, 0, 2, 1, 1, 1, 2 }, { 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2 }, { 0, 2, 2, 2, 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2 }, { 0, 0, 0, 2, 1, 1, 1, 2, 1, 1, 1, 2, 0, 0, 0, 2 }, { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2 }, { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2 }, { 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2, 2, 2, 2, 2 }, { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2 }, { 0, 0, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2 }, { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2 }, { 0, 0, 0, 2, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 1 }, { 0, 2, 2, 2, 1, 2, 2, 2, 0, 2, 2, 2, 1, 2, 2, 2 }, { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 }, { 0, 1, 1, 1, 2, 0, 1, 1, 2, 2, 0, 1, 2, 2, 2, 0 } }; static const deUint8 anchorIndicesSecondSubset2[64] = { 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 2, 8, 2, 2, 8, 8, 15, 2, 8, 2, 2, 8, 8, 2, 2, 15, 15, 6, 8, 2, 8, 15, 15, 2, 8, 2, 2, 2, 15, 15, 6, 6, 2, 6, 8, 15, 15, 2, 2, 15, 15, 15, 15, 15, 2, 2, 15 }; static const deUint8 anchorIndicesSecondSubset3[64] = { 3, 3, 15, 15, 8, 3, 15, 15, 8, 8, 6, 6, 6, 5, 3, 3, 3, 3, 8, 15, 3, 3, 6, 10, 5, 8, 8, 6, 8, 5, 15, 15, 8, 15, 3, 5, 6, 10, 8, 15, 15, 3, 15, 5, 15, 15, 15, 15, 3, 15, 5, 5, 5, 8, 5, 10, 5, 10, 8, 13, 15, 12, 3, 3 }; static const deUint8 anchorIndicesThirdSubset[64] = { 15, 8, 8, 3, 15, 15, 3, 8, 15, 15, 15, 15, 15, 15, 15, 8, 15, 8, 15, 3, 15, 8, 15, 8, 3, 15, 6, 10, 15, 15, 10, 8, 15, 3, 15, 10, 10, 8, 9, 10, 6, 15, 8, 15, 3, 6, 6, 8, 15, 3, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 3, 15, 15, 8 }; static const deUint16 weights2[4] = { 0, 21, 43, 64 }; static const deUint16 weights3[8] = { 0, 9, 18, 27, 37, 46, 55, 64 }; static const deUint16 weights4[16] = { 0, 4, 9, 13, 17, 21, 26, 30, 34, 38, 43, 47, 51, 55, 60, 64 }; inline float uint8ToFloat (deUint8 src) { return ((float)src / 255.0f); } inline float int8ToFloat (deInt8 src) { return ((float)src / 128.0f); } inline deUint32 bgr16torgba32 (deUint16 src) { const deUint32 src32 = src; const deUint8 b5 = (src32 & 0x1f); const deUint8 g6 = (src32 >> 5) & 0x3f; const deUint8 r5 = (src32 >> 11) & 0x1f; const deUint32 a8 = 0xff; const deUint32 b8 = extend5To8(b5); const deUint32 g8 = extend6To8(g6); const deUint32 r8 = extend5To8(r5); return (r8 | (g8 <<8) | (b8 << 16) | (a8 << 24)); } // Interpolates color = 1/3 * c0 + 2/3 * c1 inline deUint32 interpolateColor (deUint32 c0, deUint32 c1) { const deUint32 r0 = c0 & 0xff; const deUint32 g0 = (c0 >> 8) & 0xff; const deUint32 b0 = (c0 >> 16) & 0xff; const deUint32 a0 = (c0 >> 24) & 0xff; const deUint32 r1 = c1 & 0xff; const deUint32 g1 = (c1 >> 8) & 0xff; const deUint32 b1 = (c1 >> 16) & 0xff; const deUint32 a1 = (c1 >> 24) & 0xff; const deUint32 r = (r0 + (r1 << 1)) / 3; const deUint32 g = (g0 + (g1 << 1)) / 3; const deUint32 b = (b0 + (b1 << 1)) / 3; const deUint32 a = (a0 + (a1 << 1)) / 3; return (r | (g << 8) | (b << 16) | (a << 24)); } // Average of two colors inline deUint32 averageColor (deUint32 c0, deUint32 c1) { const deUint32 r0 = c0 & 0xff; const deUint32 g0 = (c0 >> 8) & 0xff; const deUint32 b0 = (c0 >> 16) & 0xff; const deUint32 a0 = (c0 >> 24) & 0xff; const deUint32 r1 = c1 & 0xff; const deUint32 g1 = (c1 >> 8) & 0xff; const deUint32 b1 = (c1 >> 16) & 0xff; const deUint32 a1 = (c1 >> 24) & 0xff; const deUint32 r = (r0 + r1) >> 1; const deUint32 g = (g0 + g1) >> 1; const deUint32 b = (b0 + b1) >> 1; const deUint32 a = (a0 + a1) >> 1; return (r | (g << 8) | (b << 16) | (a << 24)); } inline deInt8 extractModeBc6 (deUint8 src) { // Catch illegal modes switch(src & 0x1f) { case 0x13: case 0x17: case 0x1b: case 0x1f: return -1; }; switch (src & 0x3) { case 0: return 0; case 1: return 1; case 2: return (deInt8)(2 + ((src >> 2) & 0x7)); case 3: return (deInt8)(10 + ((src >> 2) & 0x7)); }; return -1; } inline deInt8 extractModeBc7 (deUint8 src) { for (deInt8 i = 0; i < 8; i++) if (src & (1 << i)) return i; return -1; } inline deUint64 get64BitBlockLE (const deUint8* src, int blockNdx) { // Same as get64BitBlock, but little-endian. deUint64 block = 0; for (int i = 0; i < 8; i++) block |= (deUint64)(src[blockNdx*8+i]) << (8ull*i); return block; } inline deUint32 getBits128 (deUint64 low, deUint64 high, deUint32 first, deUint32 last) { const deUint64 d[2] = { low, high }; const bool reverse = first > last; deUint32 ret = 0; if (reverse) { const deUint32 tmp = first; first = last; last = tmp; } const int elementFirst = first / 64; const int elementLast = last / 64; if (elementFirst == elementLast) { // Bits contained in one of the 64bit elements const deUint32 shift = first % 64; const deUint32 len = last - first + 1; const deUint32 mask = (1 << len) - 1; ret = (deUint32)((d[elementFirst] >> shift) & mask); } else { // Bits contained in both of the 64bit elements DE_ASSERT(last > 63); DE_ASSERT(first < 64); const deUint32 len0 = 64 - first; const deUint32 mask0 = (1 << len0) - 1; const deUint32 data0 = (deUint32)(low >> first) & mask0; const deUint32 len1 = last - 63; const deUint32 mask1 = (1 << len1) - 1; const deUint32 data1 = (deUint32)(high & mask1); ret = (deUint32)((data1 << len0) | data0); } if (reverse) { const deUint32 len = last - first + 1; const deUint32 orig = ret; ret = 0; for (deUint32 i = 0; i < len; i++) { ret |= ((orig >> (len - 1 - i)) & 1) << i; } } return ret; } inline deInt32 signExtend (deInt32 value, deInt32 srcBits, deInt32 dstBits) { deUint32 sign = value & (1 << (srcBits - 1)); if (!sign) return value; deInt32 dstMask = (deInt32)(((deUint64)1 << dstBits) - 1); deInt32 extendedBits = 0xffffffff << srcBits; return (value | extendedBits) & dstMask; } inline deInt32 unquantize (deInt32 x, int mode, bool hasSign) { if (hasSign) { bool s = false; if (epBits[mode] >= 16) return x; if (x < 0) { s = true; x = -x; } if (x == 0) x = 0; else if (x >= (((deInt32)1 << (epBits[mode] - 1)) - 1)) x = 0x7fff; else x = (((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1); if (s) x = -x; return x; } else { if (epBits[mode] >= 15) return x; else if (x == 0) return 0; else if (x == (((deInt32)1 << epBits[mode]) - 1)) return 0xffff; else return ((((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1)); } } inline deInt32 interpolate (deInt32 a, deInt32 b, deUint32 index, deUint32 indexPrecision) { const deUint16* weights[] = {weights2, weights3, weights4}; const deUint16* weight = weights[indexPrecision-2]; DE_ASSERT(indexPrecision >= 2 && indexPrecision <= 4); return (((64 - weight[index]) * a + weight[index] * b + 32) >> 6); } inline deInt16 finishUnquantize (deInt32 x, bool hasSign) { if (hasSign) { if (x < 0) x = -(((-x) * 31) >> 5); else x = (x * 31) >> 5; if (x < 0) x = (-x) | 0x8000; } else { x = (x * 31) / 64; } return (deInt16)x; } } // BcDecompressInternal void decompressBc1 (const PixelBufferAccess& dst, const deUint8* src, bool hasAlpha) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 4; const deUint16 color0_16 = ((deUint16*)src)[0]; const deUint16 color1_16 = ((deUint16*)src)[1]; const deUint32 color0 = bgr16torgba32(color0_16); const deUint32 color1 = bgr16torgba32(color1_16); const deUint8* const indices8 = &src[4]; const bool alphaMode = color1_16 > color0_16; const deInt32 indices[16] = { (indices8[0] >> 0) & 0x3, (indices8[0] >> 2) & 0x3, (indices8[0] >> 4) & 0x3, (indices8[0] >> 6) & 0x3, (indices8[1] >> 0) & 0x3, (indices8[1] >> 2) & 0x3, (indices8[1] >> 4) & 0x3, (indices8[1] >> 6) & 0x3, (indices8[2] >> 0) & 0x3, (indices8[2] >> 2) & 0x3, (indices8[2] >> 4) & 0x3, (indices8[2] >> 6) & 0x3, (indices8[3] >> 0) & 0x3, (indices8[3] >> 2) & 0x3, (indices8[3] >> 4) & 0x3, (indices8[3] >> 6) & 0x3 }; const deUint32 colors[4] = { color0, color1, alphaMode ? averageColor(color0, color1) : interpolateColor(color1, color0), alphaMode ? (hasAlpha ? 0 : 0xff000000) : interpolateColor(color0, color1) }; for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) { for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) { deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); *dstPixel = colors[indices[y * BC_BLOCK_WIDTH + x]]; } } } void decompressBc2 (const PixelBufferAccess& dst, const deUint8* src) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 4; const deUint16 color0_16 = ((deUint16*)src)[4]; const deUint16 color1_16 = ((deUint16*)src)[5]; const deUint32 color0 = bgr16torgba32(color0_16); const deUint32 color1 = bgr16torgba32(color1_16); const deUint8* const indices8 = &src[12]; const deUint8* const alphas8 = src; const deInt32 indices[16] = { (indices8[0] >> 0) & 0x3, (indices8[0] >> 2) & 0x3, (indices8[0] >> 4) & 0x3, (indices8[0] >> 6) & 0x3, (indices8[1] >> 0) & 0x3, (indices8[1] >> 2) & 0x3, (indices8[1] >> 4) & 0x3, (indices8[1] >> 6) & 0x3, (indices8[2] >> 0) & 0x3, (indices8[2] >> 2) & 0x3, (indices8[2] >> 4) & 0x3, (indices8[2] >> 6) & 0x3, (indices8[3] >> 0) & 0x3, (indices8[3] >> 2) & 0x3, (indices8[3] >> 4) & 0x3, (indices8[3] >> 6) & 0x3 }; const deInt32 alphas[16] = { extend4To8(((alphas8[0] >> 0) & 0xf)) << 24, extend4To8(((alphas8[0] >> 4) & 0xf)) << 24, extend4To8(((alphas8[1] >> 0) & 0xf)) << 24, extend4To8(((alphas8[1] >> 4) & 0xf)) << 24, extend4To8(((alphas8[2] >> 0) & 0xf)) << 24, extend4To8(((alphas8[2] >> 4) & 0xf)) << 24, extend4To8(((alphas8[3] >> 0) & 0xf)) << 24, extend4To8(((alphas8[3] >> 4) & 0xf)) << 24, extend4To8(((alphas8[4] >> 0) & 0xf)) << 24, extend4To8(((alphas8[4] >> 4) & 0xf)) << 24, extend4To8(((alphas8[5] >> 0) & 0xf)) << 24, extend4To8(((alphas8[5] >> 4) & 0xf)) << 24, extend4To8(((alphas8[6] >> 0) & 0xf)) << 24, extend4To8(((alphas8[6] >> 4) & 0xf)) << 24, extend4To8(((alphas8[7] >> 0) & 0xf)) << 24, extend4To8(((alphas8[7] >> 4) & 0xf)) << 24 }; const deUint32 colors[4] = { color0, color1, interpolateColor(color1, color0), interpolateColor(color0, color1) }; for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) { for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) { deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[y * BC_BLOCK_WIDTH + x]; } } } void decompressBc3 (const PixelBufferAccess& dst, const deUint8* src) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 4; const deUint8 alpha0 = src[0]; const deUint8 alpha1 = src[1]; const deUint16 color0_16 = ((deUint16*)src)[4]; const deUint16 color1_16 = ((deUint16*)src)[5]; const deUint32 color0 = bgr16torgba32(color0_16); const deUint32 color1 = bgr16torgba32(color1_16); const deUint8* const indices8 = &src[12]; const deUint64 alphaBits = get64BitBlockLE(src, 0) >> 16; deUint32 alphas[8]; const deInt32 indices[16] = { (indices8[0] >> 0) & 0x3, (indices8[0] >> 2) & 0x3, (indices8[0] >> 4) & 0x3, (indices8[0] >> 6) & 0x3, (indices8[1] >> 0) & 0x3, (indices8[1] >> 2) & 0x3, (indices8[1] >> 4) & 0x3, (indices8[1] >> 6) & 0x3, (indices8[2] >> 0) & 0x3, (indices8[2] >> 2) & 0x3, (indices8[2] >> 4) & 0x3, (indices8[2] >> 6) & 0x3, (indices8[3] >> 0) & 0x3, (indices8[3] >> 2) & 0x3, (indices8[3] >> 4) & 0x3, (indices8[3] >> 6) & 0x3 }; const deInt32 alphaIndices[16] = { (deInt32)((alphaBits >> 0) & 0x7), (deInt32)((alphaBits >> 3) & 0x7), (deInt32)((alphaBits >> 6) & 0x7), (deInt32)((alphaBits >> 9) & 0x7), (deInt32)((alphaBits >> 12) & 0x7), (deInt32)((alphaBits >> 15) & 0x7), (deInt32)((alphaBits >> 18) & 0x7), (deInt32)((alphaBits >> 21) & 0x7), (deInt32)((alphaBits >> 24) & 0x7), (deInt32)((alphaBits >> 27) & 0x7), (deInt32)((alphaBits >> 30) & 0x7), (deInt32)((alphaBits >> 33) & 0x7), (deInt32)((alphaBits >> 36) & 0x7), (deInt32)((alphaBits >> 39) & 0x7), (deInt32)((alphaBits >> 42) & 0x7), (deInt32)((alphaBits >> 45) & 0x7) }; const deUint32 colors[4] = { color0, color1, interpolateColor(color1, color0), interpolateColor(color0, color1) }; alphas[0] = alpha0 << 24; alphas[1] = alpha1 << 24; if (alpha0 > alpha1) { for (deUint32 i = 0; i < 6; i++) alphas[i + 2] = (((deUint32)alpha0 * (6 - i) + (deUint32)alpha1 * (1 + i)) / 7) << 24; } else { for (deUint32 i = 0; i < 4; i++) alphas[i + 2] = (((deUint32)alpha0 * (4 - i) + (deUint32)alpha1 * (1 + i)) / 5) << 24; alphas[6] = 0; alphas[7] = 0xff000000; } for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) { for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) { deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[alphaIndices[y * BC_BLOCK_WIDTH + x]]; } } } void decompressBc4 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 4; const deUint8 red0 = src[0]; const deUint8 red1 = src[1]; const deInt8 red0s = ((deInt8*)src)[0]; const deInt8 red1s = ((deInt8*)src)[1]; const deUint64 indexBits = get64BitBlockLE(src, 0) >> 16; float reds[8]; const deInt32 indices[16] = { (deInt32)((indexBits >> 0) & 0x7), (deInt32)((indexBits >> 3) & 0x7), (deInt32)((indexBits >> 6) & 0x7), (deInt32)((indexBits >> 9) & 0x7), (deInt32)((indexBits >> 12) & 0x7), (deInt32)((indexBits >> 15) & 0x7), (deInt32)((indexBits >> 18) & 0x7), (deInt32)((indexBits >> 21) & 0x7), (deInt32)((indexBits >> 24) & 0x7), (deInt32)((indexBits >> 27) & 0x7), (deInt32)((indexBits >> 30) & 0x7), (deInt32)((indexBits >> 33) & 0x7), (deInt32)((indexBits >> 36) & 0x7), (deInt32)((indexBits >> 39) & 0x7), (deInt32)((indexBits >> 42) & 0x7), (deInt32)((indexBits >> 45) & 0x7) }; reds[0] = hasSign ? int8ToFloat(red0s) : uint8ToFloat(red0); reds[1] = hasSign ? int8ToFloat(red1s) : uint8ToFloat(red1); if (reds[0] > reds[1]) { for (deUint32 i = 0; i < 6; i++) reds[i + 2] = (reds[0] * (6.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 7.0f; } else { for (deUint32 i = 0; i < 4; i++) reds[i + 2] = (reds[0] * (4.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 5.0f; reds[6] = hasSign ? -1.0f : 0.0f; reds[7] = 1.0f; } for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) { for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) { float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize); *dstPixel = reds[indices[y * BC_BLOCK_WIDTH + x]]; } } } void decompressBc5 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 8; float rg[2][8]; deUint32 indices[2][16]; for (deUint32 c = 0; c < 2; c++) { const deUint32 offset = c * 8; const deUint8 rg0 = src[offset]; const deUint8 rg1 = src[offset + 1]; const deInt8 rg0s = ((deInt8*)src)[offset]; const deInt8 rg1s = ((deInt8*)src)[offset + 1]; const deUint64 indexBits = get64BitBlockLE(src, c) >> 16; for (deUint32 i = 0; i < 16; i++) indices[c][i] = (indexBits >> (i * 3)) & 0x7; rg[c][0] = hasSign ? int8ToFloat(rg0s) : uint8ToFloat(rg0); rg[c][1] = hasSign ? int8ToFloat(rg1s) : uint8ToFloat(rg1); if (rg[c][0] > rg[c][1]) { for (deUint32 i = 0; i < 6; i++) rg[c][i + 2] = (rg[c][0] * (6.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 7.0f; } else { for (deUint32 i = 0; i < 4; i++) rg[c][i + 2] = (rg[c][0] * (4.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 5.0f; rg[c][6] = hasSign ? -1.0f : 0.0f; rg[c][7] = 1.0f; } } for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) { for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) { float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize); for (deUint32 i = 0; i < 2; i++) dstPixel[i] = rg[i][indices[i][y * BC_BLOCK_WIDTH + x]]; } } } void decompressBc6H (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) { using namespace BcDecompressInternal; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 6; deInt32 mode = extractModeBc6(src[0]); IVec4 r (0); IVec4 g (0); IVec4 b (0); deUint32 deltaBitsR = 0; deUint32 deltaBitsG = 0; deUint32 deltaBitsB = 0; const deUint64 low = ((deUint64*)src)[0]; const deUint64 high = ((deUint64*)src)[1]; const deUint32 d = mode < 10 ? getBits128(low, high, 77, 81) : 0; const deUint32 numRegions = mode > 9 ? 1 : 2; const deUint32 numEndpoints = numRegions * 2; const bool transformed = mode != 9 && mode != 10; const deUint32 colorIndexBC = mode < 10 ? 3 : 4; deUint64 colorIndexData = high >> (mode < 10 ? 18 : 1); const deUint32 anchorIndex[2] = { 0, anchorIndicesSecondSubset2[d] }; switch (mode) { case 0: g[2] |= getBits128(low, high, 2, 2) << 4; b[2] |= getBits128(low, high, 3, 3) << 4; b[3] |= getBits128(low, high, 4, 4) << 4; r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 39); g[3] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 49); b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 59); b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 75); b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsG = deltaBitsB = 5; break; case 1: g[2] |= getBits128(low, high, 2, 2) << 5; g[3] |= getBits128(low, high, 3, 3) << 4; g[3] |= getBits128(low, high, 4, 4) << 5; r[0] |= getBits128(low, high, 5, 11); b[3] |= getBits128(low, high, 12, 12); b[3] |= getBits128(low, high, 13, 13) << 1; b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 21); b[2] |= getBits128(low, high, 22, 22) << 5; b[3] |= getBits128(low, high, 23, 23) << 2; g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 31); b[3] |= getBits128(low, high, 32, 32) << 3; b[3] |= getBits128(low, high, 33, 33) << 5; b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 40); g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 60); b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 70); r[3] |= getBits128(low, high, 71, 76); deltaBitsR = deltaBitsG = deltaBitsB = 6; break; case 2: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 39); r[0] |= getBits128(low, high, 40, 40) << 10; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 48); g[0] |= getBits128(low, high, 49, 49) << 10; b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 58); b[0] |= getBits128(low, high, 59, 59) << 10; b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 75); b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = 5; deltaBitsG = deltaBitsB = 4; break; case 3: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 38); r[0] |= getBits128(low, high, 39, 39) << 10; g[3] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 49); g[0] |= getBits128(low, high, 50, 50) << 10; g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 58); b[0] |= getBits128(low, high, 59, 59) << 10; b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 68); b[3] |= getBits128(low, high, 69, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 74); g[2] |= getBits128(low, high, 75, 75) << 4; b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsB = 4; deltaBitsG = 5; break; case 4: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 38); r[0] |= getBits128(low, high, 39, 39) << 10; b[2] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 48); g[0] |= getBits128(low, high, 49, 49) << 10; b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 59); b[0] |= getBits128(low, high, 60, 60) << 10; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 68); b[3] |= getBits128(low, high, 69, 69) << 1; b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 74); b[3] |= getBits128(low, high, 75, 75) << 4; b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsG = 4; deltaBitsB = 5; break; case 5: r[0] |= getBits128(low, high, 5, 13); b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 23); g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 33); b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 39); g[3] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 49); b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 59); b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 75); b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsG = deltaBitsB = 5; break; case 6: r[0] |= getBits128(low, high, 5, 12); g[3] |= getBits128(low, high, 13, 13) << 4; b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 22); b[3] |= getBits128(low, high, 23, 23) << 2; g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 32); b[3] |= getBits128(low, high, 33, 33) << 3; b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 40); g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 49); b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 59); b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 70); r[3] |= getBits128(low, high, 71, 76); deltaBitsR = 6; deltaBitsG = deltaBitsB = 5; break; case 7: r[0] |= getBits128(low, high, 5, 12); b[3] |= getBits128(low, high, 13, 13); b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 22); g[2] |= getBits128(low, high, 23, 23) << 5; g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 32); g[3] |= getBits128(low, high, 33, 33) << 5; b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 39); g[3] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 59); b[3] |= getBits128(low, high, 60, 60) << 1; b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 75); b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsB = 5; deltaBitsG = 6; break; case 8: r[0] |= getBits128(low, high, 5, 12); b[3] |= getBits128(low, high, 13, 13) << 1; b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 22); b[2] |= getBits128(low, high, 23, 23) << 5; g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 32); b[3] |= getBits128(low, high, 33, 33) << 5; b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 39); g[3] |= getBits128(low, high, 40, 40) << 4; g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 49); b[3] |= getBits128(low, high, 50, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 60); b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 69); b[3] |= getBits128(low, high, 70, 70) << 2; r[3] |= getBits128(low, high, 71, 75); b[3] |= getBits128(low, high, 76, 76) << 3; deltaBitsR = deltaBitsG = 5; deltaBitsB = 6; break; case 9: r[0] |= getBits128(low, high, 5, 10); g[3] |= getBits128(low, high, 11, 11) << 4; b[3] |= getBits128(low, high, 12, 13); b[2] |= getBits128(low, high, 14, 14) << 4; g[0] |= getBits128(low, high, 15, 20); g[2] |= getBits128(low, high, 21, 21) << 5; b[2] |= getBits128(low, high, 22, 22) << 5; b[3] |= getBits128(low, high, 23, 23) << 2; g[2] |= getBits128(low, high, 24, 24) << 4; b[0] |= getBits128(low, high, 25, 30); g[3] |= getBits128(low, high, 31, 31) << 5; b[3] |= getBits128(low, high, 32, 32) << 3; b[3] |= getBits128(low, high, 33, 33) << 5; b[3] |= getBits128(low, high, 34, 34) << 4; r[1] |= getBits128(low, high, 35, 40); g[2] |= getBits128(low, high, 41, 44); g[1] |= getBits128(low, high, 45, 50); g[3] |= getBits128(low, high, 51, 54); b[1] |= getBits128(low, high, 55, 60); b[2] |= getBits128(low, high, 61, 64); r[2] |= getBits128(low, high, 65, 70); r[3] |= getBits128(low, high, 71, 76); deltaBitsR = deltaBitsG = deltaBitsB = 6; break; case 10: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 44); g[1] |= getBits128(low, high, 45, 54); b[1] |= getBits128(low, high, 55, 64); deltaBitsR = deltaBitsG = deltaBitsB = 10; break; case 11: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 43); r[0] |= getBits128(low, high, 44, 44) << 10; g[1] |= getBits128(low, high, 45, 53); g[0] |= getBits128(low, high, 54, 54) << 10; b[1] |= getBits128(low, high, 55, 63); b[0] |= getBits128(low, high, 64, 64) << 10; deltaBitsR = deltaBitsG = deltaBitsB = 9; break; case 12: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 42); r[0] |= getBits128(low, high, 44, 43) << 10; g[1] |= getBits128(low, high, 45, 52); g[0] |= getBits128(low, high, 54, 53) << 10; b[1] |= getBits128(low, high, 55, 62); b[0] |= getBits128(low, high, 64, 63) << 10; deltaBitsR = deltaBitsG = deltaBitsB = 8; break; case 13: r[0] |= getBits128(low, high, 5, 14); g[0] |= getBits128(low, high, 15, 24); b[0] |= getBits128(low, high, 25, 34); r[1] |= getBits128(low, high, 35, 38); r[0] |= getBits128(low, high, 44, 39) << 10; g[1] |= getBits128(low, high, 45, 48); g[0] |= getBits128(low, high, 54, 49) << 10; b[1] |= getBits128(low, high, 55, 58); b[0] |= getBits128(low, high, 64, 59) << 10; deltaBitsR = deltaBitsG = deltaBitsB = 4; break; }; if (hasSign) { r[0] = signExtend(r[0], epBits[mode], 32); g[0] = signExtend(g[0], epBits[mode], 32); b[0] = signExtend(b[0], epBits[mode], 32); } if (transformed) { for (deUint32 i = 1; i < numEndpoints; i++) { r[i] = signExtend(r[i], deltaBitsR, 32); r[i] = (r[0] + r[i]) & (((deUint32)1 << epBits[mode]) - 1); g[i] = signExtend(g[i], deltaBitsG, 32); g[i] = (g[0] + g[i]) & (((deUint32)1 << epBits[mode]) - 1); b[i] = signExtend(b[i], deltaBitsB, 32); b[i] = (b[0] + b[i]) & (((deUint32)1 << epBits[mode]) - 1); } } if (hasSign) { for (deUint32 i = 1; i < 4; i++) { r[i] = signExtend(r[i], epBits[mode], 32); g[i] = signExtend(g[i], epBits[mode], 32); b[i] = signExtend(b[i], epBits[mode], 32); } } for (deUint32 i = 0; i < numEndpoints; i++) { r[i] = unquantize(r[i], mode, hasSign); g[i] = unquantize(g[i], mode, hasSign); b[i] = unquantize(b[i], mode, hasSign); } for (deUint32 i = 0; i < 16; i++) { const deUint32 subsetIndex = (numRegions == 1 ? 0 : partitions2[d][i]); const deUint32 bits = (i == anchorIndex[subsetIndex]) ? (colorIndexBC - 1) : colorIndexBC; const deUint32 colorIndex = (deUint32)(colorIndexData & ((1 << bits) - 1)); const deInt32 endpointStartR = r[2 * subsetIndex]; const deInt32 endpointEndR = r[2 * subsetIndex + 1]; const deInt32 endpointStartG = g[2 * subsetIndex]; const deInt32 endpointEndG = g[2 * subsetIndex + 1]; const deInt32 endpointStartB = b[2 * subsetIndex]; const deInt32 endpointEndB = b[2 * subsetIndex + 1]; const deInt16 r16 = finishUnquantize(interpolate(endpointStartR, endpointEndR, colorIndex, colorIndexBC), hasSign); const deInt16 g16 = finishUnquantize(interpolate(endpointStartG, endpointEndG, colorIndex, colorIndexBC), hasSign); const deInt16 b16 = finishUnquantize(interpolate(endpointStartB, endpointEndB, colorIndex, colorIndexBC), hasSign); const deInt32 y = i / 4; const deInt32 x = i % 4; deInt16* const dstPixel = (deInt16*)(dstPtr + y * dstRowPitch + x * dstPixelSize); if (mode == -1) { dstPixel[0] = 0; dstPixel[1] = 0; dstPixel[2] = 0; } else { dstPixel[0] = r16; dstPixel[1] = g16; dstPixel[2] = b16; } colorIndexData >>= bits; } } void decompressBc7 (const PixelBufferAccess& dst, const deUint8* src) { using namespace BcDecompressInternal; static const deUint8 subsets[] = { 3, 2, 3, 2, 1, 1, 1, 2 }; static const deUint8 partitionBits[] = { 4, 6, 6, 6, 0, 0, 0, 6 }; static const deUint8 endpointBits[8][5] = { //r, g, b, a, p { 4, 4, 4, 0, 1 }, { 6, 6, 6, 0, 1 }, { 5, 5, 5, 0, 0 }, { 7, 7, 7, 0, 1 }, { 5, 5, 5, 6, 0 }, { 7, 7, 7, 8, 0 }, { 7, 7, 7, 7, 1 }, { 5, 5, 5, 5, 1 } }; static const deUint8 indexBits[] = { 3, 3, 2, 2, 2, 2, 4, 2 }; deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); const deUint32 dstRowPitch = dst.getRowPitch(); const deUint32 dstPixelSize = 4; const deUint64 low = ((deUint64*)src)[0]; const deUint64 high = ((deUint64*)src)[1]; const deInt32 mode = extractModeBc7(src[0]); deUint32 numSubsets = 1; deUint32 offset = mode + 1; deUint32 rotation = 0; deUint32 idxMode = 0; deUint32 endpoints[6][5]; deUint32 partitionSetId = 0; // Decode partition data from explicit partition bits if (mode == 0 || mode == 1 || mode == 2 || mode == 3 || mode == 7) { numSubsets = subsets[mode]; partitionSetId = getBits128(low, high, offset, offset + partitionBits[mode] - 1); offset += partitionBits[mode]; } // Extract rotation bits if (mode == 4 || mode == 5) { rotation = getBits128(low, high, offset, offset + 1); offset += 2; if (mode == 4) { idxMode = getBits128(low, high, offset, offset); offset++; } } { const deUint32 numEndpoints = numSubsets * 2; // Extract raw, compressed endpoint bits for (deUint32 cpnt = 0; cpnt < 5; cpnt++) { for (deUint32 ep = 0; ep < numEndpoints; ep++) { if (mode == 1 && cpnt == 4 && ep > 1) continue; // Mode 1 has shared P bits int n = mode == -1 ? 0 : endpointBits[mode][cpnt]; if (n > 0) endpoints[ep][cpnt] = getBits128(low, high, offset, offset + n - 1); offset += n; } } // Decode endpoints if (mode == 0 || mode == 1 || mode == 3 || mode == 6 || mode == 7) { // First handle modes that have P-bits for (deUint32 ep = 0; ep < numEndpoints; ep++) { for (deUint32 cpnt = 0; cpnt < 4; cpnt++) { endpoints[ep][cpnt] <<= 1; } } if (mode == 1) { // P-bit is shared const deUint32 pbitZero = endpoints[0][4]; const deUint32 pbitOne = endpoints[1][4]; for (deUint32 cpnt = 0; cpnt < 3; cpnt++) { endpoints[0][cpnt] |= pbitZero; endpoints[1][cpnt] |= pbitZero; endpoints[2][cpnt] |= pbitOne; endpoints[3][cpnt] |= pbitOne; } } else { // Unique p-bit per endpoint for (deUint32 ep = 0; ep < numEndpoints; ep++) { for (deUint32 cpnt = 0; cpnt < 4; cpnt++) { endpoints[ep][cpnt] |= endpoints[ep][4]; } } } } for (deUint32 ep = 0; ep < numEndpoints; ep++) { // Left shift endpoint components so that their MSB lies in bit 7 for (deUint32 cpnt = 0; cpnt < 4; cpnt++) endpoints[ep][cpnt] <<= 8 - (endpointBits[mode][cpnt] + endpointBits[mode][4]); // Replicate each component's MSB into the LSBs revealed by the left-shift operation above for (deUint32 cpnt = 0; cpnt < 4; cpnt++) endpoints[ep][cpnt] |= endpoints[ep][cpnt] >> (endpointBits[mode][cpnt] + endpointBits[mode][4]); } // If this mode does not explicitly define the alpha component set alpha equal to 1.0 if (mode < 4) { for (deUint32 ep = 0; ep < numEndpoints; ep++) endpoints[ep][3] = 255; } } { deUint32 colorIdxOffset = offset + ((mode == 4 && idxMode) ? 31 : 0); deUint32 alphaIdxOffset = offset + ((mode == 5 || (mode == 4 && !idxMode)) ? 31 : 0); for (deUint32 pixel = 0; pixel < 16; pixel++) { const deUint32 y = pixel / 4; const deUint32 x = pixel % 4; deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); deUint32 subsetIndex = 0; deUint32 anchorIndex = 0; deUint32 endpointStart[4]; deUint32 endpointEnd[4]; if (mode == -1) { *dstPixel = 0; continue; } if (numSubsets == 2) subsetIndex = partitions2[partitionSetId][pixel]; else if (numSubsets == 3) subsetIndex = partitions3[partitionSetId][pixel]; if (numSubsets == 2 && subsetIndex == 1) { anchorIndex = anchorIndicesSecondSubset2[partitionSetId]; } else if (numSubsets == 3) { if (subsetIndex == 1) anchorIndex = anchorIndicesSecondSubset3[partitionSetId]; else if (subsetIndex == 2) anchorIndex = anchorIndicesThirdSubset[partitionSetId]; } for (deUint32 cpnt = 0; cpnt < 4; cpnt++) { endpointStart[cpnt] = endpoints[2 * subsetIndex][cpnt]; endpointEnd[cpnt] = endpoints[2 * subsetIndex + 1][cpnt]; } { const deUint32 colorInterpolationBits = indexBits[mode] + idxMode; const deUint32 colorIndexBits = colorInterpolationBits - ((anchorIndex == pixel) ? 1 : 0); const deUint32 alphaInterpolationBits = mode == 4 ? 3 - idxMode : (mode == 5 ? 2 : colorInterpolationBits); const deUint32 alphaIndexBits = alphaInterpolationBits - ((anchorIndex == pixel) ? 1 : 0); const deUint32 colorIdx = getBits128(low, high, colorIdxOffset, colorIdxOffset + colorIndexBits - 1); const deUint32 alphaIdx = (mode == 4 || mode == 5) ? getBits128(low, high, alphaIdxOffset, alphaIdxOffset + alphaIndexBits - 1) : colorIdx; const deUint32 r = interpolate(endpointStart[0], endpointEnd[0], colorIdx, colorInterpolationBits); const deUint32 g = interpolate(endpointStart[1], endpointEnd[1], colorIdx, colorInterpolationBits); const deUint32 b = interpolate(endpointStart[2], endpointEnd[2], colorIdx, colorInterpolationBits); const deUint32 a = interpolate(endpointStart[3], endpointEnd[3], alphaIdx, alphaInterpolationBits); colorIdxOffset += colorIndexBits; alphaIdxOffset += alphaIndexBits; if ((mode == 4 || mode == 5) && rotation != 0) { if (rotation == 1) *dstPixel = a | (g << 8) | (b << 16) | (r << 24); else if (rotation == 2) *dstPixel = r | (a << 8) | (b << 16) | (g << 24); else *dstPixel = r | (g << 8) | (a << 16) | (b << 24); } else { *dstPixel = r | (g << 8) | (b << 16) | (a << 24); } } } } } void decompressBlock (CompressedTexFormat format, const PixelBufferAccess& dst, const deUint8* src, const TexDecompressionParams& params) { // No 3D blocks supported right now DE_ASSERT(dst.getDepth() == 1); switch (format) { case COMPRESSEDTEXFORMAT_ETC1_RGB8: decompressETC1 (dst, src); break; case COMPRESSEDTEXFORMAT_EAC_R11: decompressEAC_R11 (dst, src, false); break; case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: decompressEAC_R11 (dst, src, true); break; case COMPRESSEDTEXFORMAT_EAC_RG11: decompressEAC_RG11 (dst, src, false); break; case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: decompressEAC_RG11 (dst, src, true); break; case COMPRESSEDTEXFORMAT_ETC2_RGB8: decompressETC2 (dst, src); break; case COMPRESSEDTEXFORMAT_ETC2_SRGB8: decompressETC2 (dst, src); break; case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: decompressETC2_RGB8_PUNCHTHROUGH_ALPHA1 (dst, src); break; case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: decompressETC2_RGB8_PUNCHTHROUGH_ALPHA1 (dst, src); break; case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: decompressETC2_EAC_RGBA8 (dst, src); break; case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: decompressETC2_EAC_RGBA8 (dst, src); break; case COMPRESSEDTEXFORMAT_ASTC_4x4_RGBA: case COMPRESSEDTEXFORMAT_ASTC_5x4_RGBA: case COMPRESSEDTEXFORMAT_ASTC_5x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_6x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_6x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_8x8_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x5_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x6_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x8_RGBA: case COMPRESSEDTEXFORMAT_ASTC_10x10_RGBA: case COMPRESSEDTEXFORMAT_ASTC_12x10_RGBA: case COMPRESSEDTEXFORMAT_ASTC_12x12_RGBA: case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: astc::decompress(dst, src, format, params.astcMode); break; case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: decompressBc1 (dst, src, false); break; case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: decompressBc1 (dst, src, false); break; case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: decompressBc1 (dst, src, true); break; case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: decompressBc1 (dst, src, true); break; case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: decompressBc2 (dst, src); break; case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: decompressBc2 (dst, src); break; case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: decompressBc3 (dst, src); break; case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: decompressBc3 (dst, src); break; case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: decompressBc4 (dst, src, false); break; case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: decompressBc4 (dst, src, true); break; case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: decompressBc5 (dst, src, false); break; case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: decompressBc5 (dst, src, true); break; case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: decompressBc6H (dst, src, false); break; case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: decompressBc6H (dst, src, true); break; case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: decompressBc7 (dst, src); break; case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: decompressBc7 (dst, src); break; default: DE_FATAL("Unexpected format"); break; } } int componentSum (const IVec3& vec) { return vec.x() + vec.y() + vec.z(); } } // anonymous void decompress (const PixelBufferAccess& dst, CompressedTexFormat fmt, const deUint8* src, const TexDecompressionParams& params) { const int blockSize = getBlockSize(fmt); const IVec3 blockPixelSize (getBlockPixelSize(fmt)); const IVec3 blockCount (deDivRoundUp32(dst.getWidth(), blockPixelSize.x()), deDivRoundUp32(dst.getHeight(), blockPixelSize.y()), deDivRoundUp32(dst.getDepth(), blockPixelSize.z())); const IVec3 blockPitches (blockSize, blockSize * blockCount.x(), blockSize * blockCount.x() * blockCount.y()); std::vector uncompressedBlock (dst.getFormat().getPixelSize() * blockPixelSize.x() * blockPixelSize.y() * blockPixelSize.z()); const PixelBufferAccess blockAccess (getUncompressedFormat(fmt), blockPixelSize.x(), blockPixelSize.y(), blockPixelSize.z(), &uncompressedBlock[0]); DE_ASSERT(dst.getFormat() == getUncompressedFormat(fmt)); for (int blockZ = 0; blockZ < blockCount.z(); blockZ++) for (int blockY = 0; blockY < blockCount.y(); blockY++) for (int blockX = 0; blockX < blockCount.x(); blockX++) { const IVec3 blockPos (blockX, blockY, blockZ); const deUint8* const blockPtr = src + componentSum(blockPos * blockPitches); const IVec3 copySize (de::min(blockPixelSize.x(), dst.getWidth() - blockPos.x() * blockPixelSize.x()), de::min(blockPixelSize.y(), dst.getHeight() - blockPos.y() * blockPixelSize.y()), de::min(blockPixelSize.z(), dst.getDepth() - blockPos.z() * blockPixelSize.z())); const IVec3 dstPixelPos = blockPos * blockPixelSize; decompressBlock(fmt, blockAccess, blockPtr, params); copy(getSubregion(dst, dstPixelPos.x(), dstPixelPos.y(), dstPixelPos.z(), copySize.x(), copySize.y(), copySize.z()), getSubregion(blockAccess, 0, 0, 0, copySize.x(), copySize.y(), copySize.z())); } } CompressedTexture::CompressedTexture (void) : m_format (COMPRESSEDTEXFORMAT_LAST) , m_width (0) , m_height (0) , m_depth (0) { } CompressedTexture::CompressedTexture (CompressedTexFormat format, int width, int height, int depth) : m_format (COMPRESSEDTEXFORMAT_LAST) , m_width (0) , m_height (0) , m_depth (0) { setStorage(format, width, height, depth); } CompressedTexture::~CompressedTexture (void) { } void CompressedTexture::setStorage (CompressedTexFormat format, int width, int height, int depth) { m_format = format; m_width = width; m_height = height; m_depth = depth; if (m_format != COMPRESSEDTEXFORMAT_LAST) { const IVec3 blockPixelSize = getBlockPixelSize(m_format); const int blockSize = getBlockSize(m_format); m_data.resize(deDivRoundUp32(m_width, blockPixelSize.x()) * deDivRoundUp32(m_height, blockPixelSize.y()) * deDivRoundUp32(m_depth, blockPixelSize.z()) * blockSize); } else { DE_ASSERT(m_format == COMPRESSEDTEXFORMAT_LAST); DE_ASSERT(m_width == 0 && m_height == 0 && m_depth == 0); m_data.resize(0); } } /*--------------------------------------------------------------------*//*! * \brief Decode to uncompressed pixel data * \param dst Destination buffer *//*--------------------------------------------------------------------*/ void CompressedTexture::decompress (const PixelBufferAccess& dst, const TexDecompressionParams& params) const { DE_ASSERT(dst.getWidth() == m_width && dst.getHeight() == m_height && dst.getDepth() == m_depth); DE_ASSERT(dst.getFormat() == getUncompressedFormat(m_format)); tcu::decompress(dst, m_format, &m_data[0], params); } } // tcu