| /*------------------------------------------------------------------------- |
| * drawElements Quality Program Tester Core |
| * ---------------------------------------- |
| * |
| * Copyright 2014 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| * |
| *//*! |
| * \file |
| * \brief Compressed Texture Utilities. |
| *//*--------------------------------------------------------------------*/ |
| |
| #include "tcuCompressedTexture.hpp" |
| #include "tcuTextureUtil.hpp" |
| #include "tcuAstcUtil.hpp" |
| |
| #include "deStringUtil.hpp" |
| #include "deFloat16.h" |
| |
| #include <algorithm> |
| |
| namespace tcu |
| { |
| |
| int getBlockSize (CompressedTexFormat format) |
| { |
| if (isAstcFormat(format)) |
| { |
| return astc::BLOCK_SIZE_BYTES; |
| } |
| else if (isEtcFormat(format)) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ETC1_RGB8: return 8; |
| case COMPRESSEDTEXFORMAT_EAC_R11: return 8; |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: return 8; |
| case COMPRESSEDTEXFORMAT_EAC_RG11: return 16; |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: return 16; |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8: return 8; |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8: return 8; |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: return 8; |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: return 8; |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: return 16; |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: return 16; |
| |
| default: |
| DE_ASSERT(false); |
| return -1; |
| } |
| } |
| else if (isBcFormat(format)) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: return 8; |
| case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: return 16; |
| case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return 16; |
| |
| default: |
| DE_ASSERT(false); |
| return -1; |
| } |
| } |
| else |
| { |
| DE_ASSERT(false); |
| return -1; |
| } |
| } |
| |
| IVec3 getBlockPixelSize (CompressedTexFormat format) |
| { |
| if (isEtcFormat(format)) |
| { |
| return IVec3(4, 4, 1); |
| } |
| else if (isAstcFormat(format)) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ASTC_4x4_RGBA: return IVec3(4, 4, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_5x4_RGBA: return IVec3(5, 4, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_5x5_RGBA: return IVec3(5, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_6x5_RGBA: return IVec3(6, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_6x6_RGBA: return IVec3(6, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x5_RGBA: return IVec3(8, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x6_RGBA: return IVec3(8, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x8_RGBA: return IVec3(8, 8, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x5_RGBA: return IVec3(10, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x6_RGBA: return IVec3(10, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x8_RGBA: return IVec3(10, 8, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x10_RGBA: return IVec3(10, 10, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_12x10_RGBA: return IVec3(12, 10, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_12x12_RGBA: return IVec3(12, 12, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: return IVec3(4, 4, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: return IVec3(5, 4, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: return IVec3(5, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: return IVec3(6, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: return IVec3(6, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: return IVec3(8, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: return IVec3(8, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: return IVec3(8, 8, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: return IVec3(10, 5, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: return IVec3(10, 6, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: return IVec3(10, 8, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: return IVec3(10, 10, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: return IVec3(12, 10, 1); |
| case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: return IVec3(12, 12, 1); |
| |
| default: |
| DE_ASSERT(false); |
| return IVec3(); |
| } |
| } |
| else if (isBcFormat(format)) |
| { |
| return IVec3(4, 4, 1); |
| } |
| else |
| { |
| DE_ASSERT(false); |
| return IVec3(-1); |
| } |
| } |
| |
| bool isEtcFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ETC1_RGB8: |
| case COMPRESSEDTEXFORMAT_EAC_R11: |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: |
| case COMPRESSEDTEXFORMAT_EAC_RG11: |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8: |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8: |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| bool isBcFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| bool isBcBitExactFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| bool isBcSRGBFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: |
| case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| bool isAstcFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ASTC_4x4_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_5x4_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_5x5_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_6x5_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_6x6_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_8x5_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_8x6_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_8x8_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_10x5_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_10x6_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_10x8_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_10x10_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_12x10_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_12x12_RGBA: |
| case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| bool isAstcSRGBFormat (CompressedTexFormat format) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ASTC_4x4_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_5x4_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_5x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_6x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_6x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_8x8_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x5_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x6_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x8_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_10x10_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_12x10_SRGB8_ALPHA8: |
| case COMPRESSEDTEXFORMAT_ASTC_12x12_SRGB8_ALPHA8: |
| return true; |
| |
| default: |
| return false; |
| } |
| } |
| |
| TextureFormat getUncompressedFormat (CompressedTexFormat format) |
| { |
| if (isEtcFormat(format)) |
| { |
| switch (format) |
| { |
| case COMPRESSEDTEXFORMAT_ETC1_RGB8: return TextureFormat(TextureFormat::RGB, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_EAC_R11: return TextureFormat(TextureFormat::R, TextureFormat::UNORM_INT16); |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_R11: return TextureFormat(TextureFormat::R, TextureFormat::SNORM_INT16); |
| case COMPRESSEDTEXFORMAT_EAC_RG11: return TextureFormat(TextureFormat::RG, TextureFormat::UNORM_INT16); |
| case COMPRESSEDTEXFORMAT_EAC_SIGNED_RG11: return TextureFormat(TextureFormat::RG, TextureFormat::SNORM_INT16); |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8: return TextureFormat(TextureFormat::RGB, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8: return TextureFormat(TextureFormat::sRGB, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_ETC2_RGB8_PUNCHTHROUGH_ALPHA1: return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_ETC2_SRGB8_PUNCHTHROUGH_ALPHA1: return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_RGBA8: return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); |
| case COMPRESSEDTEXFORMAT_ETC2_EAC_SRGB8_ALPHA8: return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); |
| |
| default: |
| DE_ASSERT(false); |
| return TextureFormat(); |
| } |
| } |
| else if (isAstcFormat(format)) |
| { |
| if (isAstcSRGBFormat(format)) |
| return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); |
| else |
| return TextureFormat(TextureFormat::RGBA, TextureFormat::HALF_FLOAT); |
| } |
| else if (isBcFormat(format)) |
| { |
| if (format == COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK) |
| return TextureFormat(TextureFormat::R, TextureFormat::FLOAT); |
| else if (format == COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK) |
| return TextureFormat(TextureFormat::RG, TextureFormat::FLOAT); |
| else if (format == COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK || format == COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK) |
| return TextureFormat(TextureFormat::RGB, TextureFormat::HALF_FLOAT); |
| else if (isBcSRGBFormat(format)) |
| return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8); |
| else |
| return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8); |
| } |
| else |
| { |
| DE_ASSERT(false); |
| return TextureFormat(); |
| } |
| } |
| |
| CompressedTexFormat getAstcFormatByBlockSize (const IVec3& size, bool isSRGB) |
| { |
| if (size.z() > 1) |
| throw InternalError("3D ASTC textures not currently supported"); |
| |
| for (int fmtI = 0; fmtI < COMPRESSEDTEXFORMAT_LAST; fmtI++) |
| { |
| const CompressedTexFormat fmt = (CompressedTexFormat)fmtI; |
| |
| if (isAstcFormat(fmt) && getBlockPixelSize(fmt) == size && isAstcSRGBFormat(fmt) == isSRGB) |
| return fmt; |
| } |
| |
| throw InternalError("Invalid ASTC block size " + de::toString(size.x()) + "x" + de::toString(size.y()) + "x" + de::toString(size.z())); |
| } |
| |
| namespace |
| { |
| |
| inline deUint8 extend4To8 (deUint8 src) |
| { |
| DE_ASSERT((src & ~((1<<4)-1)) == 0); |
| return (deUint8)((src << 4) | src); |
| } |
| |
| inline deUint8 extend5To8 (deUint8 src) |
| { |
| DE_ASSERT((src & ~((1<<5)-1)) == 0); |
| return (deUint8)((src << 3) | (src >> 2)); |
| } |
| |
| inline deUint8 extend6To8 (deUint8 src) |
| { |
| DE_ASSERT((src & ~((1<<6)-1)) == 0); |
| return (deUint8)((src << 2) | (src >> 4)); |
| } |
| |
| // \todo [2013-08-06 nuutti] ETC and ASTC decompression codes are rather unrelated, and are already in their own "private" namespaces - should this be split to multiple files? |
| |
| namespace EtcDecompressInternal |
| { |
| |
| enum |
| { |
| ETC2_BLOCK_WIDTH = 4, |
| ETC2_BLOCK_HEIGHT = 4, |
| ETC2_UNCOMPRESSED_PIXEL_SIZE_A8 = 1, |
| ETC2_UNCOMPRESSED_PIXEL_SIZE_R11 = 2, |
| ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11 = 4, |
| ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8 = 3, |
| ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 = 4, |
| ETC2_UNCOMPRESSED_BLOCK_SIZE_A8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8, |
| ETC2_UNCOMPRESSED_BLOCK_SIZE_R11 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11, |
| ETC2_UNCOMPRESSED_BLOCK_SIZE_RG11 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11, |
| ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8, |
| ETC2_UNCOMPRESSED_BLOCK_SIZE_RGBA8 = ETC2_BLOCK_WIDTH*ETC2_BLOCK_HEIGHT*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 |
| }; |
| |
| inline deUint64 get64BitBlock (const deUint8* src, int blockNdx) |
| { |
| // Stored in big-endian form. |
| deUint64 block = 0; |
| |
| for (int i = 0; i < 8; i++) |
| block = (block << 8ull) | (deUint64)(src[blockNdx*8+i]); |
| |
| return block; |
| } |
| |
| // Return the first 64 bits of a 128 bit block. |
| inline deUint64 get128BitBlockStart (const deUint8* src, int blockNdx) |
| { |
| return get64BitBlock(src, 2*blockNdx); |
| } |
| |
| // Return the last 64 bits of a 128 bit block. |
| inline deUint64 get128BitBlockEnd (const deUint8* src, int blockNdx) |
| { |
| return get64BitBlock(src, 2*blockNdx + 1); |
| } |
| |
| inline deUint32 getBit (deUint64 src, int bit) |
| { |
| return (src >> bit) & 1; |
| } |
| |
| inline deUint32 getBits (deUint64 src, int low, int high) |
| { |
| const int numBits = (high-low) + 1; |
| DE_ASSERT(de::inRange(numBits, 1, 32)); |
| if (numBits < 32) |
| return (deUint32)((src >> low) & ((1u<<numBits)-1)); |
| else |
| return (deUint32)((src >> low) & 0xFFFFFFFFu); |
| } |
| |
| inline deUint8 extend7To8 (deUint8 src) |
| { |
| DE_ASSERT((src & ~((1<<7)-1)) == 0); |
| return (deUint8)((src << 1) | (src >> 6)); |
| } |
| |
| inline deInt8 extendSigned3To8 (deUint8 src) |
| { |
| const bool isNeg = (src & (1<<2)) != 0; |
| return (deInt8)((isNeg ? ~((1<<3)-1) : 0) | src); |
| } |
| |
| inline deUint8 extend5Delta3To8 (deUint8 base5, deUint8 delta3) |
| { |
| const deUint8 t = (deUint8)((deInt8)base5 + extendSigned3To8(delta3)); |
| return extend5To8(t); |
| } |
| |
| inline deUint16 extend11To16 (deUint16 src) |
| { |
| DE_ASSERT((src & ~((1<<11)-1)) == 0); |
| return (deUint16)((src << 5) | (src >> 6)); |
| } |
| |
| inline deInt16 extend11To16WithSign (deInt16 src) |
| { |
| if (src < 0) |
| return (deInt16)(-(deInt16)extend11To16((deUint16)(-src))); |
| else |
| return (deInt16)extend11To16(src); |
| } |
| |
| void decompressETC1Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8], deUint64 src) |
| { |
| const int diffBit = (int)getBit(src, 33); |
| const int flipBit = (int)getBit(src, 32); |
| const deUint32 table[2] = { getBits(src, 37, 39), getBits(src, 34, 36) }; |
| deUint8 baseR[2]; |
| deUint8 baseG[2]; |
| deUint8 baseB[2]; |
| |
| if (diffBit == 0) |
| { |
| // Individual mode. |
| baseR[0] = extend4To8((deUint8)getBits(src, 60, 63)); |
| baseR[1] = extend4To8((deUint8)getBits(src, 56, 59)); |
| baseG[0] = extend4To8((deUint8)getBits(src, 52, 55)); |
| baseG[1] = extend4To8((deUint8)getBits(src, 48, 51)); |
| baseB[0] = extend4To8((deUint8)getBits(src, 44, 47)); |
| baseB[1] = extend4To8((deUint8)getBits(src, 40, 43)); |
| } |
| else |
| { |
| // Differential mode (diffBit == 1). |
| deUint8 bR = (deUint8)getBits(src, 59, 63); // 5b |
| deUint8 dR = (deUint8)getBits(src, 56, 58); // 3b |
| deUint8 bG = (deUint8)getBits(src, 51, 55); |
| deUint8 dG = (deUint8)getBits(src, 48, 50); |
| deUint8 bB = (deUint8)getBits(src, 43, 47); |
| deUint8 dB = (deUint8)getBits(src, 40, 42); |
| |
| baseR[0] = extend5To8(bR); |
| baseG[0] = extend5To8(bG); |
| baseB[0] = extend5To8(bB); |
| |
| baseR[1] = extend5Delta3To8(bR, dR); |
| baseG[1] = extend5Delta3To8(bG, dG); |
| baseB[1] = extend5Delta3To8(bB, dB); |
| } |
| |
| static const int modifierTable[8][4] = |
| { |
| // 00 01 10 11 |
| { 2, 8, -2, -8 }, |
| { 5, 17, -5, -17 }, |
| { 9, 29, -9, -29 }, |
| { 13, 42, -13, -42 }, |
| { 18, 60, -18, -60 }, |
| { 24, 80, -24, -80 }, |
| { 33, 106, -33, -106 }, |
| { 47, 183, -47, -183 } |
| }; |
| |
| // Write final pixels. |
| for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) |
| { |
| const int x = pixelNdx / ETC2_BLOCK_HEIGHT; |
| const int y = pixelNdx % ETC2_BLOCK_HEIGHT; |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; |
| const int subBlock = ((flipBit ? y : x) >= 2) ? 1 : 0; |
| const deUint32 tableNdx = table[subBlock]; |
| const deUint32 modifierNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); |
| const int modifier = modifierTable[tableNdx][modifierNdx]; |
| |
| dst[dstOffset+0] = (deUint8)deClamp32((int)baseR[subBlock] + modifier, 0, 255); |
| dst[dstOffset+1] = (deUint8)deClamp32((int)baseG[subBlock] + modifier, 0, 255); |
| dst[dstOffset+2] = (deUint8)deClamp32((int)baseB[subBlock] + modifier, 0, 255); |
| } |
| } |
| |
| // if alphaMode is true, do PUNCHTHROUGH and store alpha to alphaDst; otherwise do ordinary ETC2 RGB8. |
| void decompressETC2Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8], deUint64 src, deUint8 alphaDst[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8], bool alphaMode) |
| { |
| enum Etc2Mode |
| { |
| MODE_INDIVIDUAL = 0, |
| MODE_DIFFERENTIAL, |
| MODE_T, |
| MODE_H, |
| MODE_PLANAR, |
| |
| MODE_LAST |
| }; |
| |
| const int diffOpaqueBit = (int)getBit(src, 33); |
| const deInt8 selBR = (deInt8)getBits(src, 59, 63); // 5 bits. |
| const deInt8 selBG = (deInt8)getBits(src, 51, 55); |
| const deInt8 selBB = (deInt8)getBits(src, 43, 47); |
| const deInt8 selDR = extendSigned3To8((deUint8)getBits(src, 56, 58)); // 3 bits. |
| const deInt8 selDG = extendSigned3To8((deUint8)getBits(src, 48, 50)); |
| const deInt8 selDB = extendSigned3To8((deUint8)getBits(src, 40, 42)); |
| Etc2Mode mode; |
| |
| if (!alphaMode && diffOpaqueBit == 0) |
| mode = MODE_INDIVIDUAL; |
| else if (!de::inRange(selBR + selDR, 0, 31)) |
| mode = MODE_T; |
| else if (!de::inRange(selBG + selDG, 0, 31)) |
| mode = MODE_H; |
| else if (!de::inRange(selBB + selDB, 0, 31)) |
| mode = MODE_PLANAR; |
| else |
| mode = MODE_DIFFERENTIAL; |
| |
| if (mode == MODE_INDIVIDUAL || mode == MODE_DIFFERENTIAL) |
| { |
| // Individual and differential modes have some steps in common, handle them here. |
| static const int modifierTable[8][4] = |
| { |
| // 00 01 10 11 |
| { 2, 8, -2, -8 }, |
| { 5, 17, -5, -17 }, |
| { 9, 29, -9, -29 }, |
| { 13, 42, -13, -42 }, |
| { 18, 60, -18, -60 }, |
| { 24, 80, -24, -80 }, |
| { 33, 106, -33, -106 }, |
| { 47, 183, -47, -183 } |
| }; |
| |
| const int flipBit = (int)getBit(src, 32); |
| const deUint32 table[2] = { getBits(src, 37, 39), getBits(src, 34, 36) }; |
| deUint8 baseR[2]; |
| deUint8 baseG[2]; |
| deUint8 baseB[2]; |
| |
| if (mode == MODE_INDIVIDUAL) |
| { |
| // Individual mode, initial values. |
| baseR[0] = extend4To8((deUint8)getBits(src, 60, 63)); |
| baseR[1] = extend4To8((deUint8)getBits(src, 56, 59)); |
| baseG[0] = extend4To8((deUint8)getBits(src, 52, 55)); |
| baseG[1] = extend4To8((deUint8)getBits(src, 48, 51)); |
| baseB[0] = extend4To8((deUint8)getBits(src, 44, 47)); |
| baseB[1] = extend4To8((deUint8)getBits(src, 40, 43)); |
| } |
| else |
| { |
| // Differential mode, initial values. |
| baseR[0] = extend5To8(selBR); |
| baseG[0] = extend5To8(selBG); |
| baseB[0] = extend5To8(selBB); |
| |
| baseR[1] = extend5To8((deUint8)(selBR + selDR)); |
| baseG[1] = extend5To8((deUint8)(selBG + selDG)); |
| baseB[1] = extend5To8((deUint8)(selBB + selDB)); |
| } |
| |
| // Write final pixels for individual or differential mode. |
| for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) |
| { |
| const int x = pixelNdx / ETC2_BLOCK_HEIGHT; |
| const int y = pixelNdx % ETC2_BLOCK_HEIGHT; |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; |
| const int subBlock = ((flipBit ? y : x) >= 2) ? 1 : 0; |
| const deUint32 tableNdx = table[subBlock]; |
| const deUint32 modifierNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); |
| const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. |
| |
| // If doing PUNCHTHROUGH version (alphaMode), opaque bit may affect colors. |
| if (alphaMode && diffOpaqueBit == 0 && modifierNdx == 2) |
| { |
| dst[dstOffset+0] = 0; |
| dst[dstOffset+1] = 0; |
| dst[dstOffset+2] = 0; |
| alphaDst[alphaDstOffset] = 0; |
| } |
| else |
| { |
| int modifier; |
| |
| // PUNCHTHROUGH version and opaque bit may also affect modifiers. |
| if (alphaMode && diffOpaqueBit == 0 && (modifierNdx == 0 || modifierNdx == 2)) |
| modifier = 0; |
| else |
| modifier = modifierTable[tableNdx][modifierNdx]; |
| |
| dst[dstOffset+0] = (deUint8)deClamp32((int)baseR[subBlock] + modifier, 0, 255); |
| dst[dstOffset+1] = (deUint8)deClamp32((int)baseG[subBlock] + modifier, 0, 255); |
| dst[dstOffset+2] = (deUint8)deClamp32((int)baseB[subBlock] + modifier, 0, 255); |
| |
| if (alphaMode) |
| alphaDst[alphaDstOffset] = 255; |
| } |
| } |
| } |
| else if (mode == MODE_T || mode == MODE_H) |
| { |
| // T and H modes have some steps in common, handle them here. |
| static const int distTable[8] = { 3, 6, 11, 16, 23, 32, 41, 64 }; |
| |
| deUint8 paintR[4]; |
| deUint8 paintG[4]; |
| deUint8 paintB[4]; |
| |
| if (mode == MODE_T) |
| { |
| // T mode, calculate paint values. |
| const deUint8 R1a = (deUint8)getBits(src, 59, 60); |
| const deUint8 R1b = (deUint8)getBits(src, 56, 57); |
| const deUint8 G1 = (deUint8)getBits(src, 52, 55); |
| const deUint8 B1 = (deUint8)getBits(src, 48, 51); |
| const deUint8 R2 = (deUint8)getBits(src, 44, 47); |
| const deUint8 G2 = (deUint8)getBits(src, 40, 43); |
| const deUint8 B2 = (deUint8)getBits(src, 36, 39); |
| const deUint32 distNdx = (getBits(src, 34, 35) << 1) | getBit(src, 32); |
| const int dist = distTable[distNdx]; |
| |
| paintR[0] = extend4To8((deUint8)((R1a << 2) | R1b)); |
| paintG[0] = extend4To8(G1); |
| paintB[0] = extend4To8(B1); |
| paintR[2] = extend4To8(R2); |
| paintG[2] = extend4To8(G2); |
| paintB[2] = extend4To8(B2); |
| paintR[1] = (deUint8)deClamp32((int)paintR[2] + dist, 0, 255); |
| paintG[1] = (deUint8)deClamp32((int)paintG[2] + dist, 0, 255); |
| paintB[1] = (deUint8)deClamp32((int)paintB[2] + dist, 0, 255); |
| paintR[3] = (deUint8)deClamp32((int)paintR[2] - dist, 0, 255); |
| paintG[3] = (deUint8)deClamp32((int)paintG[2] - dist, 0, 255); |
| paintB[3] = (deUint8)deClamp32((int)paintB[2] - dist, 0, 255); |
| } |
| else |
| { |
| // H mode, calculate paint values. |
| const deUint8 R1 = (deUint8)getBits(src, 59, 62); |
| const deUint8 G1a = (deUint8)getBits(src, 56, 58); |
| const deUint8 G1b = (deUint8)getBit(src, 52); |
| const deUint8 B1a = (deUint8)getBit(src, 51); |
| const deUint8 B1b = (deUint8)getBits(src, 47, 49); |
| const deUint8 R2 = (deUint8)getBits(src, 43, 46); |
| const deUint8 G2 = (deUint8)getBits(src, 39, 42); |
| const deUint8 B2 = (deUint8)getBits(src, 35, 38); |
| deUint8 baseR[2]; |
| deUint8 baseG[2]; |
| deUint8 baseB[2]; |
| deUint32 baseValue[2]; |
| deUint32 distNdx; |
| int dist; |
| |
| baseR[0] = extend4To8(R1); |
| baseG[0] = extend4To8((deUint8)((G1a << 1) | G1b)); |
| baseB[0] = extend4To8((deUint8)((B1a << 3) | B1b)); |
| baseR[1] = extend4To8(R2); |
| baseG[1] = extend4To8(G2); |
| baseB[1] = extend4To8(B2); |
| baseValue[0] = (((deUint32)baseR[0]) << 16) | (((deUint32)baseG[0]) << 8) | baseB[0]; |
| baseValue[1] = (((deUint32)baseR[1]) << 16) | (((deUint32)baseG[1]) << 8) | baseB[1]; |
| distNdx = (getBit(src, 34) << 2) | (getBit(src, 32) << 1) | (deUint32)(baseValue[0] >= baseValue[1]); |
| dist = distTable[distNdx]; |
| |
| paintR[0] = (deUint8)deClamp32((int)baseR[0] + dist, 0, 255); |
| paintG[0] = (deUint8)deClamp32((int)baseG[0] + dist, 0, 255); |
| paintB[0] = (deUint8)deClamp32((int)baseB[0] + dist, 0, 255); |
| paintR[1] = (deUint8)deClamp32((int)baseR[0] - dist, 0, 255); |
| paintG[1] = (deUint8)deClamp32((int)baseG[0] - dist, 0, 255); |
| paintB[1] = (deUint8)deClamp32((int)baseB[0] - dist, 0, 255); |
| paintR[2] = (deUint8)deClamp32((int)baseR[1] + dist, 0, 255); |
| paintG[2] = (deUint8)deClamp32((int)baseG[1] + dist, 0, 255); |
| paintB[2] = (deUint8)deClamp32((int)baseB[1] + dist, 0, 255); |
| paintR[3] = (deUint8)deClamp32((int)baseR[1] - dist, 0, 255); |
| paintG[3] = (deUint8)deClamp32((int)baseG[1] - dist, 0, 255); |
| paintB[3] = (deUint8)deClamp32((int)baseB[1] - dist, 0, 255); |
| } |
| |
| // Write final pixels for T or H mode. |
| for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) |
| { |
| const int x = pixelNdx / ETC2_BLOCK_HEIGHT; |
| const int y = pixelNdx % ETC2_BLOCK_HEIGHT; |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; |
| const deUint32 paintNdx = (getBit(src, 16+pixelNdx) << 1) | getBit(src, pixelNdx); |
| const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. |
| |
| if (alphaMode && diffOpaqueBit == 0 && paintNdx == 2) |
| { |
| dst[dstOffset+0] = 0; |
| dst[dstOffset+1] = 0; |
| dst[dstOffset+2] = 0; |
| alphaDst[alphaDstOffset] = 0; |
| } |
| else |
| { |
| dst[dstOffset+0] = (deUint8)deClamp32((int)paintR[paintNdx], 0, 255); |
| dst[dstOffset+1] = (deUint8)deClamp32((int)paintG[paintNdx], 0, 255); |
| dst[dstOffset+2] = (deUint8)deClamp32((int)paintB[paintNdx], 0, 255); |
| |
| if (alphaMode) |
| alphaDst[alphaDstOffset] = 255; |
| } |
| } |
| } |
| else |
| { |
| // Planar mode. |
| const deUint8 GO1 = (deUint8)getBit(src, 56); |
| const deUint8 GO2 = (deUint8)getBits(src, 49, 54); |
| const deUint8 BO1 = (deUint8)getBit(src, 48); |
| const deUint8 BO2 = (deUint8)getBits(src, 43, 44); |
| const deUint8 BO3 = (deUint8)getBits(src, 39, 41); |
| const deUint8 RH1 = (deUint8)getBits(src, 34, 38); |
| const deUint8 RH2 = (deUint8)getBit(src, 32); |
| const deUint8 RO = extend6To8((deUint8)getBits(src, 57, 62)); |
| const deUint8 GO = extend7To8((deUint8)((GO1 << 6) | GO2)); |
| const deUint8 BO = extend6To8((deUint8)((BO1 << 5) | (BO2 << 3) | BO3)); |
| const deUint8 RH = extend6To8((deUint8)((RH1 << 1) | RH2)); |
| const deUint8 GH = extend7To8((deUint8)getBits(src, 25, 31)); |
| const deUint8 BH = extend6To8((deUint8)getBits(src, 19, 24)); |
| const deUint8 RV = extend6To8((deUint8)getBits(src, 13, 18)); |
| const deUint8 GV = extend7To8((deUint8)getBits(src, 6, 12)); |
| const deUint8 BV = extend6To8((deUint8)getBits(src, 0, 5)); |
| |
| // Write final pixels for planar mode. |
| for (int y = 0; y < 4; y++) |
| { |
| for (int x = 0; x < 4; x++) |
| { |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8; |
| const int unclampedR = (x * ((int)RH-(int)RO) + y * ((int)RV-(int)RO) + 4*(int)RO + 2) >> 2; |
| const int unclampedG = (x * ((int)GH-(int)GO) + y * ((int)GV-(int)GO) + 4*(int)GO + 2) >> 2; |
| const int unclampedB = (x * ((int)BH-(int)BO) + y * ((int)BV-(int)BO) + 4*(int)BO + 2) >> 2; |
| const int alphaDstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; // Only needed for PUNCHTHROUGH version. |
| |
| dst[dstOffset+0] = (deUint8)deClamp32(unclampedR, 0, 255); |
| dst[dstOffset+1] = (deUint8)deClamp32(unclampedG, 0, 255); |
| dst[dstOffset+2] = (deUint8)deClamp32(unclampedB, 0, 255); |
| |
| if (alphaMode) |
| alphaDst[alphaDstOffset] = 255; |
| } |
| } |
| } |
| } |
| |
| void decompressEAC8Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8], deUint64 src) |
| { |
| static const int modifierTable[16][8] = |
| { |
| {-3, -6, -9, -15, 2, 5, 8, 14}, |
| {-3, -7, -10, -13, 2, 6, 9, 12}, |
| {-2, -5, -8, -13, 1, 4, 7, 12}, |
| {-2, -4, -6, -13, 1, 3, 5, 12}, |
| {-3, -6, -8, -12, 2, 5, 7, 11}, |
| {-3, -7, -9, -11, 2, 6, 8, 10}, |
| {-4, -7, -8, -11, 3, 6, 7, 10}, |
| {-3, -5, -8, -11, 2, 4, 7, 10}, |
| {-2, -6, -8, -10, 1, 5, 7, 9}, |
| {-2, -5, -8, -10, 1, 4, 7, 9}, |
| {-2, -4, -8, -10, 1, 3, 7, 9}, |
| {-2, -5, -7, -10, 1, 4, 6, 9}, |
| {-3, -4, -7, -10, 2, 3, 6, 9}, |
| {-1, -2, -3, -10, 0, 1, 2, 9}, |
| {-4, -6, -8, -9, 3, 5, 7, 8}, |
| {-3, -5, -7, -9, 2, 4, 6, 8} |
| }; |
| |
| const deUint8 baseCodeword = (deUint8)getBits(src, 56, 63); |
| const deUint8 multiplier = (deUint8)getBits(src, 52, 55); |
| const deUint32 tableNdx = getBits(src, 48, 51); |
| |
| for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) |
| { |
| const int x = pixelNdx / ETC2_BLOCK_HEIGHT; |
| const int y = pixelNdx % ETC2_BLOCK_HEIGHT; |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8; |
| const int pixelBitNdx = 45 - 3*pixelNdx; |
| const deUint32 modifierNdx = (getBit(src, pixelBitNdx + 2) << 2) | (getBit(src, pixelBitNdx + 1) << 1) | getBit(src, pixelBitNdx); |
| const int modifier = modifierTable[tableNdx][modifierNdx]; |
| |
| dst[dstOffset] = (deUint8)deClamp32((int)baseCodeword + (int)multiplier*modifier, 0, 255); |
| } |
| } |
| |
| void decompressEAC11Block (deUint8 dst[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11], deUint64 src, bool signedMode) |
| { |
| static const int modifierTable[16][8] = |
| { |
| {-3, -6, -9, -15, 2, 5, 8, 14}, |
| {-3, -7, -10, -13, 2, 6, 9, 12}, |
| {-2, -5, -8, -13, 1, 4, 7, 12}, |
| {-2, -4, -6, -13, 1, 3, 5, 12}, |
| {-3, -6, -8, -12, 2, 5, 7, 11}, |
| {-3, -7, -9, -11, 2, 6, 8, 10}, |
| {-4, -7, -8, -11, 3, 6, 7, 10}, |
| {-3, -5, -8, -11, 2, 4, 7, 10}, |
| {-2, -6, -8, -10, 1, 5, 7, 9}, |
| {-2, -5, -8, -10, 1, 4, 7, 9}, |
| {-2, -4, -8, -10, 1, 3, 7, 9}, |
| {-2, -5, -7, -10, 1, 4, 6, 9}, |
| {-3, -4, -7, -10, 2, 3, 6, 9}, |
| {-1, -2, -3, -10, 0, 1, 2, 9}, |
| {-4, -6, -8, -9, 3, 5, 7, 8}, |
| {-3, -5, -7, -9, 2, 4, 6, 8} |
| }; |
| |
| const deInt32 multiplier = (deInt32)getBits(src, 52, 55); |
| const deInt32 tableNdx = (deInt32)getBits(src, 48, 51); |
| deInt32 baseCodeword = (deInt32)getBits(src, 56, 63); |
| |
| if (signedMode) |
| { |
| if (baseCodeword > 127) |
| baseCodeword -= 256; |
| if (baseCodeword == -128) |
| baseCodeword = -127; |
| } |
| |
| for (int pixelNdx = 0; pixelNdx < ETC2_BLOCK_HEIGHT*ETC2_BLOCK_WIDTH; pixelNdx++) |
| { |
| const int x = pixelNdx / ETC2_BLOCK_HEIGHT; |
| const int y = pixelNdx % ETC2_BLOCK_HEIGHT; |
| const int dstOffset = (y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11; |
| const int pixelBitNdx = 45 - 3*pixelNdx; |
| const deUint32 modifierNdx = (getBit(src, pixelBitNdx + 2) << 2) | (getBit(src, pixelBitNdx + 1) << 1) | getBit(src, pixelBitNdx); |
| const int modifier = modifierTable[tableNdx][modifierNdx]; |
| |
| if (signedMode) |
| { |
| deInt16 value; |
| |
| if (multiplier != 0) |
| value = (deInt16)deClamp32(baseCodeword*8 + multiplier*modifier*8, -1023, 1023); |
| else |
| value = (deInt16)deClamp32(baseCodeword*8 + modifier, -1023, 1023); |
| |
| *((deInt16*)(dst + dstOffset)) = value; |
| } |
| else |
| { |
| deUint16 value; |
| |
| if (multiplier != 0) |
| value = (deUint16)deClamp32(baseCodeword*8 + 4 + multiplier*modifier*8, 0, 2047); |
| else |
| value= (deUint16)deClamp32(baseCodeword*8 + 4 + modifier, 0, 2047); |
| |
| *((deUint16*)(dst + dstOffset)) = value; |
| } |
| } |
| } |
| |
| } // EtcDecompressInternal |
| |
| void decompressETC1 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint64 compressedBlock = get64BitBlock(src, 0); |
| |
| decompressETC1Block(dstPtr, compressedBlock); |
| } |
| |
| void decompressETC2 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint64 compressedBlock = get64BitBlock(src, 0); |
| |
| decompressETC2Block(dstPtr, compressedBlock, NULL, false); |
| } |
| |
| void decompressETC2_EAC_RGBA8 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const int dstRowPitch = dst.getRowPitch(); |
| const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8; |
| |
| const deUint64 compressedBlockAlpha = get128BitBlockStart(src, 0); |
| const deUint64 compressedBlockRGB = get128BitBlockEnd(src, 0); |
| deUint8 uncompressedBlockAlpha[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8]; |
| deUint8 uncompressedBlockRGB[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8]; |
| |
| // Decompress. |
| decompressETC2Block(uncompressedBlockRGB, compressedBlockRGB, NULL, false); |
| decompressEAC8Block(uncompressedBlockAlpha, compressedBlockAlpha); |
| |
| // Write to dst. |
| for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) |
| { |
| for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) |
| { |
| const deUint8* const srcPixelRGB = &uncompressedBlockRGB[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8]; |
| const deUint8* const srcPixelAlpha = &uncompressedBlockAlpha[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8]; |
| deUint8* const dstPixel = dstPtr + y*dstRowPitch + x*dstPixelSize; |
| |
| DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 == 4); |
| dstPixel[0] = srcPixelRGB[0]; |
| dstPixel[1] = srcPixelRGB[1]; |
| dstPixel[2] = srcPixelRGB[2]; |
| dstPixel[3] = srcPixelAlpha[0]; |
| } |
| } |
| } |
| |
| void decompressETC2_RGB8_PUNCHTHROUGH_ALPHA1 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const int dstRowPitch = dst.getRowPitch(); |
| const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8; |
| |
| const deUint64 compressedBlockRGBA = get64BitBlock(src, 0); |
| deUint8 uncompressedBlockRGB[ETC2_UNCOMPRESSED_BLOCK_SIZE_RGB8]; |
| deUint8 uncompressedBlockAlpha[ETC2_UNCOMPRESSED_BLOCK_SIZE_A8]; |
| |
| // Decompress. |
| decompressETC2Block(uncompressedBlockRGB, compressedBlockRGBA, uncompressedBlockAlpha, DE_TRUE); |
| |
| // Write to dst. |
| for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) |
| { |
| for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) |
| { |
| const deUint8* const srcPixel = &uncompressedBlockRGB[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_RGB8]; |
| const deUint8* const srcPixelAlpha = &uncompressedBlockAlpha[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_A8]; |
| deUint8* const dstPixel = dstPtr + y*dstRowPitch + x*dstPixelSize; |
| |
| DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RGBA8 == 4); |
| dstPixel[0] = srcPixel[0]; |
| dstPixel[1] = srcPixel[1]; |
| dstPixel[2] = srcPixel[2]; |
| dstPixel[3] = srcPixelAlpha[0]; |
| } |
| } |
| } |
| |
| void decompressEAC_R11 (const PixelBufferAccess& dst, const deUint8* src, bool signedMode) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const int dstRowPitch = dst.getRowPitch(); |
| const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_R11; |
| |
| const deUint64 compressedBlock = get64BitBlock(src, 0); |
| deUint8 uncompressedBlock[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; |
| |
| // Decompress. |
| decompressEAC11Block(uncompressedBlock, compressedBlock, signedMode); |
| |
| // Write to dst. |
| for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) |
| { |
| for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) |
| { |
| DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_R11 == 2); |
| |
| if (signedMode) |
| { |
| const deInt16* const srcPixel = (deInt16*)&uncompressedBlock[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| deInt16* const dstPixel = (deInt16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); |
| |
| dstPixel[0] = extend11To16WithSign(srcPixel[0]); |
| } |
| else |
| { |
| const deUint16* const srcPixel = (deUint16*)&uncompressedBlock[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| deUint16* const dstPixel = (deUint16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); |
| |
| dstPixel[0] = extend11To16(srcPixel[0]); |
| } |
| } |
| } |
| } |
| |
| void decompressEAC_RG11 (const PixelBufferAccess& dst, const deUint8* src, bool signedMode) |
| { |
| using namespace EtcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const int dstRowPitch = dst.getRowPitch(); |
| const int dstPixelSize = ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11; |
| |
| const deUint64 compressedBlockR = get128BitBlockStart(src, 0); |
| const deUint64 compressedBlockG = get128BitBlockEnd(src, 0); |
| deUint8 uncompressedBlockR[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; |
| deUint8 uncompressedBlockG[ETC2_UNCOMPRESSED_BLOCK_SIZE_R11]; |
| |
| // Decompress. |
| decompressEAC11Block(uncompressedBlockR, compressedBlockR, signedMode); |
| decompressEAC11Block(uncompressedBlockG, compressedBlockG, signedMode); |
| |
| // Write to dst. |
| for (int y = 0; y < (int)ETC2_BLOCK_HEIGHT; y++) |
| { |
| for (int x = 0; x < (int)ETC2_BLOCK_WIDTH; x++) |
| { |
| DE_STATIC_ASSERT(ETC2_UNCOMPRESSED_PIXEL_SIZE_RG11 == 4); |
| |
| if (signedMode) |
| { |
| const deInt16* const srcPixelR = (deInt16*)&uncompressedBlockR[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| const deInt16* const srcPixelG = (deInt16*)&uncompressedBlockG[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| deInt16* const dstPixel = (deInt16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); |
| |
| dstPixel[0] = extend11To16WithSign(srcPixelR[0]); |
| dstPixel[1] = extend11To16WithSign(srcPixelG[0]); |
| } |
| else |
| { |
| const deUint16* const srcPixelR = (deUint16*)&uncompressedBlockR[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| const deUint16* const srcPixelG = (deUint16*)&uncompressedBlockG[(y*ETC2_BLOCK_WIDTH + x)*ETC2_UNCOMPRESSED_PIXEL_SIZE_R11]; |
| deUint16* const dstPixel = (deUint16*)(dstPtr + y*dstRowPitch + x*dstPixelSize); |
| |
| dstPixel[0] = extend11To16(srcPixelR[0]); |
| dstPixel[1] = extend11To16(srcPixelG[0]); |
| } |
| } |
| } |
| } |
| |
| namespace BcDecompressInternal |
| { |
| |
| enum |
| { |
| BC_BLOCK_WIDTH = 4, |
| BC_BLOCK_HEIGHT = 4 |
| }; |
| |
| static const deUint8 epBits[14] = { 10, 7, 11, 11, 11, 9, 8, 8, 8, 6, 10, 11, 12, 16 }; |
| |
| static const deUint8 partitions2[64][16] = |
| { |
| { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 }, |
| { 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1 }, |
| { 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1 }, |
| { 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1 }, |
| { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1 }, |
| { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1 }, |
| { 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0 }, |
| { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0 }, |
| { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 }, |
| { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 }, |
| { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1 }, |
| { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0 }, |
| { 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 }, |
| { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0 }, |
| { 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0 }, |
| { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 }, |
| { 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0 }, |
| { 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0 }, |
| { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1 }, |
| { 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0 }, |
| { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0 }, |
| { 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0 }, |
| { 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0 }, |
| { 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1 }, |
| { 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1 }, |
| { 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0 }, |
| { 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0 }, |
| { 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0 }, |
| { 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0 }, |
| { 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0 }, |
| { 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1 }, |
| { 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1 }, |
| { 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0 }, |
| { 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0 }, |
| { 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0 }, |
| { 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0 }, |
| { 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0 }, |
| { 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1 }, |
| { 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0 }, |
| { 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0 }, |
| { 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1 }, |
| { 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1 }, |
| { 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1 }, |
| { 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 }, |
| { 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0 }, |
| { 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1 } |
| }; |
| |
| static const deUint8 partitions3[64][16] = |
| { |
| { 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 1, 2, 2, 2, 2 }, |
| { 0, 0, 0, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 2, 1 }, |
| { 0, 0, 0, 0, 2, 0, 0, 1, 2, 2, 1, 1, 2, 2, 1, 1 }, |
| { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 1, 0, 1, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2 }, |
| { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 2, 2 }, |
| { 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1 }, |
| { 0, 0, 1, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2 }, |
| { 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2 }, |
| { 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2 }, |
| { 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2 }, |
| { 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2, 1, 2, 2, 2 }, |
| { 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0, 2, 2, 2, 0 }, |
| { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2 }, |
| { 0, 1, 1, 1, 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0 }, |
| { 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2 }, |
| { 0, 0, 2, 2, 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1 }, |
| { 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2, 0, 2, 2, 2 }, |
| { 0, 0, 0, 1, 0, 0, 0, 1, 2, 2, 2, 1, 2, 2, 2, 1 }, |
| { 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2 }, |
| { 0, 0, 0, 0, 1, 1, 0, 0, 2, 2, 1, 0, 2, 2, 1, 0 }, |
| { 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1, 0, 0, 0, 0 }, |
| { 0, 0, 1, 2, 0, 0, 1, 2, 1, 1, 2, 2, 2, 2, 2, 2 }, |
| { 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1, 0, 1, 1, 0 }, |
| { 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1 }, |
| { 0, 0, 2, 2, 1, 1, 0, 2, 1, 1, 0, 2, 0, 0, 2, 2 }, |
| { 0, 1, 1, 0, 0, 1, 1, 0, 2, 0, 0, 2, 2, 2, 2, 2 }, |
| { 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1 }, |
| { 0, 0, 0, 0, 2, 0, 0, 0, 2, 2, 1, 1, 2, 2, 2, 1 }, |
| { 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 2, 2, 2 }, |
| { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 2, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 0, 0, 1, 2, 0, 0, 2, 2, 0, 2, 2, 2 }, |
| { 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0 }, |
| { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0 }, |
| { 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0 }, |
| { 0, 1, 2, 0, 2, 0, 1, 2, 1, 2, 0, 1, 0, 1, 2, 0 }, |
| { 0, 0, 1, 1, 2, 2, 0, 0, 1, 1, 2, 2, 0, 0, 1, 1 }, |
| { 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0, 1, 1 }, |
| { 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1 }, |
| { 0, 0, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2, 1, 1, 2, 2 }, |
| { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 1, 1 }, |
| { 0, 2, 2, 0, 1, 2, 2, 1, 0, 2, 2, 0, 1, 2, 2, 1 }, |
| { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 0, 1, 0, 1 }, |
| { 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1 }, |
| { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2 }, |
| { 0, 2, 2, 2, 0, 1, 1, 1, 0, 2, 2, 2, 0, 1, 1, 1 }, |
| { 0, 0, 0, 2, 1, 1, 1, 2, 0, 0, 0, 2, 1, 1, 1, 2 }, |
| { 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2 }, |
| { 0, 2, 2, 2, 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2 }, |
| { 0, 0, 0, 2, 1, 1, 1, 2, 1, 1, 1, 2, 0, 0, 0, 2 }, |
| { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2 }, |
| { 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2, 2, 2, 2, 2 }, |
| { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2 }, |
| { 0, 0, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2 }, |
| { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2 }, |
| { 0, 0, 0, 2, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 1 }, |
| { 0, 2, 2, 2, 1, 2, 2, 2, 0, 2, 2, 2, 1, 2, 2, 2 }, |
| { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 }, |
| { 0, 1, 1, 1, 2, 0, 1, 1, 2, 2, 0, 1, 2, 2, 2, 0 } |
| }; |
| |
| static const deUint8 anchorIndicesSecondSubset2[64] = { 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 2, 8, 2, 2, 8, 8, 15, 2, 8, 2, 2, 8, 8, 2, 2, |
| 15, 15, 6, 8, 2, 8, 15, 15, 2, 8, 2, 2, 2, 15, 15, 6, 6, 2, 6, 8, 15, 15, 2, 2, 15, 15, 15, 15, 15, 2, 2, 15 }; |
| |
| static const deUint8 anchorIndicesSecondSubset3[64] = { 3, 3, 15, 15, 8, 3, 15, 15, 8, 8, 6, 6, 6, 5, 3, 3, 3, 3, 8, 15, 3, 3, 6, 10, 5, 8, 8, 6, 8, 5, 15, 15, |
| 8, 15, 3, 5, 6, 10, 8, 15, 15, 3, 15, 5, 15, 15, 15, 15, 3, 15, 5, 5, 5, 8, 5, 10, 5, 10, 8, 13, 15, 12, 3, 3 }; |
| |
| static const deUint8 anchorIndicesThirdSubset[64] = { 15, 8, 8, 3, 15, 15, 3, 8, 15, 15, 15, 15, 15, 15, 15, 8, 15, 8, 15, 3, 15, 8, 15, 8, 3, 15, 6, 10, 15, 15, 10, 8, |
| 15, 3, 15, 10, 10, 8, 9, 10, 6, 15, 8, 15, 3, 6, 6, 8, 15, 3, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 3, 15, 15, 8 }; |
| |
| static const deUint16 weights2[4] = { 0, 21, 43, 64 }; |
| static const deUint16 weights3[8] = { 0, 9, 18, 27, 37, 46, 55, 64 }; |
| static const deUint16 weights4[16] = { 0, 4, 9, 13, 17, 21, 26, 30, 34, 38, 43, 47, 51, 55, 60, 64 }; |
| |
| inline float uint8ToFloat (deUint8 src) |
| { |
| return ((float)src / 255.0f); |
| } |
| |
| inline float int8ToFloat (deInt8 src) |
| { |
| return ((float)src / 128.0f); |
| } |
| |
| inline deUint32 bgr16torgba32 (deUint16 src) |
| { |
| const deUint32 src32 = src; |
| const deUint8 b5 = (src32 & 0x1f); |
| const deUint8 g6 = (src32 >> 5) & 0x3f; |
| const deUint8 r5 = (src32 >> 11) & 0x1f; |
| const deUint32 a8 = 0xff; |
| const deUint32 b8 = extend5To8(b5); |
| const deUint32 g8 = extend6To8(g6); |
| const deUint32 r8 = extend5To8(r5); |
| |
| return (r8 | (g8 <<8) | (b8 << 16) | (a8 << 24)); |
| } |
| |
| // Interpolates color = 1/3 * c0 + 2/3 * c1 |
| inline deUint32 interpolateColor (deUint32 c0, deUint32 c1) |
| { |
| const deUint32 r0 = c0 & 0xff; |
| const deUint32 g0 = (c0 >> 8) & 0xff; |
| const deUint32 b0 = (c0 >> 16) & 0xff; |
| const deUint32 a0 = (c0 >> 24) & 0xff; |
| |
| const deUint32 r1 = c1 & 0xff; |
| const deUint32 g1 = (c1 >> 8) & 0xff; |
| const deUint32 b1 = (c1 >> 16) & 0xff; |
| const deUint32 a1 = (c1 >> 24) & 0xff; |
| |
| const deUint32 r = (r0 + (r1 << 1)) / 3; |
| const deUint32 g = (g0 + (g1 << 1)) / 3; |
| const deUint32 b = (b0 + (b1 << 1)) / 3; |
| const deUint32 a = (a0 + (a1 << 1)) / 3; |
| |
| return (r | (g << 8) | (b << 16) | (a << 24)); |
| } |
| |
| // Average of two colors |
| inline deUint32 averageColor (deUint32 c0, deUint32 c1) |
| { |
| const deUint32 r0 = c0 & 0xff; |
| const deUint32 g0 = (c0 >> 8) & 0xff; |
| const deUint32 b0 = (c0 >> 16) & 0xff; |
| const deUint32 a0 = (c0 >> 24) & 0xff; |
| |
| const deUint32 r1 = c1 & 0xff; |
| const deUint32 g1 = (c1 >> 8) & 0xff; |
| const deUint32 b1 = (c1 >> 16) & 0xff; |
| const deUint32 a1 = (c1 >> 24) & 0xff; |
| |
| const deUint32 r = (r0 + r1) >> 1; |
| const deUint32 g = (g0 + g1) >> 1; |
| const deUint32 b = (b0 + b1) >> 1; |
| const deUint32 a = (a0 + a1) >> 1; |
| |
| return (r | (g << 8) | (b << 16) | (a << 24)); |
| } |
| |
| inline deInt8 extractModeBc6 (deUint8 src) |
| { |
| // Catch illegal modes |
| switch(src & 0x1f) |
| { |
| case 0x13: |
| case 0x17: |
| case 0x1b: |
| case 0x1f: |
| return -1; |
| } |
| |
| switch (src & 0x3) |
| { |
| case 0: return 0; |
| case 1: return 1; |
| case 2: return (deInt8)(2 + ((src >> 2) & 0x7)); |
| case 3: return (deInt8)(10 + ((src >> 2) & 0x7)); |
| } |
| |
| return -1; |
| } |
| |
| inline deInt8 extractModeBc7 (deUint8 src) |
| { |
| for (deInt8 i = 0; i < 8; i++) |
| if (src & (1 << i)) |
| return i; |
| |
| return -1; |
| } |
| |
| inline deUint64 get64BitBlockLE (const deUint8* src, int blockNdx) |
| { |
| // Same as get64BitBlock, but little-endian. |
| deUint64 block = 0; |
| |
| for (int i = 0; i < 8; i++) |
| block |= (deUint64)(src[blockNdx*8+i]) << (8ull*i); |
| |
| return block; |
| } |
| |
| inline deUint32 getBits128 (deUint64 low, deUint64 high, deUint32 first, deUint32 last) |
| { |
| const deUint64 d[2] = { low, high }; |
| const bool reverse = first > last; |
| deUint32 ret = 0; |
| |
| if (reverse) |
| { |
| const deUint32 tmp = first; |
| first = last; |
| last = tmp; |
| } |
| |
| const int elementFirst = first / 64; |
| const int elementLast = last / 64; |
| |
| if (elementFirst == elementLast) |
| { |
| // Bits contained in one of the 64bit elements |
| const deUint32 shift = first % 64; |
| const deUint32 len = last - first + 1; |
| const deUint32 mask = (1 << len) - 1; |
| ret = (deUint32)((d[elementFirst] >> shift) & mask); |
| } |
| else |
| { |
| // Bits contained in both of the 64bit elements |
| DE_ASSERT(last > 63); |
| DE_ASSERT(first < 64); |
| const deUint32 len0 = 64 - first; |
| const deUint32 mask0 = (1 << len0) - 1; |
| const deUint32 data0 = (deUint32)(low >> first) & mask0; |
| const deUint32 len1 = last - 63; |
| const deUint32 mask1 = (1 << len1) - 1; |
| const deUint32 data1 = (deUint32)(high & mask1); |
| ret = (deUint32)((data1 << len0) | data0); |
| } |
| |
| if (reverse) |
| { |
| const deUint32 len = last - first + 1; |
| const deUint32 orig = ret; |
| ret = 0; |
| |
| for (deUint32 i = 0; i < len; i++) |
| { |
| ret |= ((orig >> (len - 1 - i)) & 1) << i; |
| } |
| } |
| |
| return ret; |
| } |
| |
| inline deInt32 signExtend (deInt32 value, deInt32 srcBits, deInt32 dstBits) |
| { |
| deUint32 sign = value & (1 << (srcBits - 1)); |
| |
| if (!sign) return value; |
| |
| deInt32 dstMask = (deInt32)(((deUint64)1 << dstBits) - 1); |
| deInt32 extendedBits = 0xffffffff << srcBits; |
| return (value | extendedBits) & dstMask; |
| } |
| |
| inline deInt32 unquantize (deInt32 x, int mode, bool hasSign) |
| { |
| if (hasSign) |
| { |
| bool s = false; |
| |
| if (epBits[mode] >= 16) return x; |
| |
| if (x < 0) |
| { |
| s = true; |
| x = -x; |
| } |
| |
| if (x == 0) |
| x = 0; |
| else if (x >= (((deInt32)1 << (epBits[mode] - 1)) - 1)) |
| x = 0x7fff; |
| else |
| x = (((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1); |
| |
| if (s) |
| x = -x; |
| |
| return x; |
| } |
| else |
| { |
| if (epBits[mode] >= 15) |
| return x; |
| else if (x == 0) |
| return 0; |
| else if (x == (((deInt32)1 << epBits[mode]) - 1)) |
| return 0xffff; |
| else |
| return ((((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1)); |
| } |
| } |
| |
| inline deInt32 interpolate (deInt32 a, deInt32 b, deUint32 index, deUint32 indexPrecision) |
| { |
| const deUint16* weights[] = {weights2, weights3, weights4}; |
| const deUint16* weight = weights[indexPrecision-2]; |
| DE_ASSERT(indexPrecision >= 2 && indexPrecision <= 4); |
| |
| return (((64 - weight[index]) * a + weight[index] * b + 32) >> 6); |
| } |
| |
| inline deInt16 finishUnquantize (deInt32 x, bool hasSign) |
| { |
| if (hasSign) |
| { |
| if (x < 0) |
| x = -(((-x) * 31) >> 5); |
| else |
| x = (x * 31) >> 5; |
| |
| if (x < 0) |
| x = (-x) | 0x8000; |
| } |
| else |
| { |
| x = (x * 31) / 64; |
| } |
| |
| return (deInt16)x; |
| } |
| |
| } // BcDecompressInternal |
| |
| void decompressBc1 (const PixelBufferAccess& dst, const deUint8* src, bool hasAlpha) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 4; |
| const deUint16 color0_16 = ((deUint16*)src)[0]; |
| const deUint16 color1_16 = ((deUint16*)src)[1]; |
| const deUint32 color0 = bgr16torgba32(color0_16); |
| const deUint32 color1 = bgr16torgba32(color1_16); |
| const deUint8* const indices8 = &src[4]; |
| |
| const bool alphaMode = color1_16 > color0_16; |
| |
| const deInt32 indices[16] = |
| { |
| (indices8[0] >> 0) & 0x3, |
| (indices8[0] >> 2) & 0x3, |
| (indices8[0] >> 4) & 0x3, |
| (indices8[0] >> 6) & 0x3, |
| (indices8[1] >> 0) & 0x3, |
| (indices8[1] >> 2) & 0x3, |
| (indices8[1] >> 4) & 0x3, |
| (indices8[1] >> 6) & 0x3, |
| (indices8[2] >> 0) & 0x3, |
| (indices8[2] >> 2) & 0x3, |
| (indices8[2] >> 4) & 0x3, |
| (indices8[2] >> 6) & 0x3, |
| (indices8[3] >> 0) & 0x3, |
| (indices8[3] >> 2) & 0x3, |
| (indices8[3] >> 4) & 0x3, |
| (indices8[3] >> 6) & 0x3 |
| }; |
| |
| const deUint32 colors[4] = |
| { |
| color0, |
| color1, |
| alphaMode ? averageColor(color0, color1) : interpolateColor(color1, color0), |
| alphaMode ? (hasAlpha ? 0 : 0xff000000) : interpolateColor(color0, color1) |
| }; |
| |
| for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) |
| { |
| for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) |
| { |
| deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); |
| *dstPixel = colors[indices[y * BC_BLOCK_WIDTH + x]]; |
| } |
| } |
| } |
| |
| void decompressBc2 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 4; |
| const deUint16 color0_16 = ((deUint16*)src)[4]; |
| const deUint16 color1_16 = ((deUint16*)src)[5]; |
| const deUint32 color0 = bgr16torgba32(color0_16); |
| const deUint32 color1 = bgr16torgba32(color1_16); |
| const deUint8* const indices8 = &src[12]; |
| const deUint8* const alphas8 = src; |
| |
| const deInt32 indices[16] = |
| { |
| (indices8[0] >> 0) & 0x3, |
| (indices8[0] >> 2) & 0x3, |
| (indices8[0] >> 4) & 0x3, |
| (indices8[0] >> 6) & 0x3, |
| (indices8[1] >> 0) & 0x3, |
| (indices8[1] >> 2) & 0x3, |
| (indices8[1] >> 4) & 0x3, |
| (indices8[1] >> 6) & 0x3, |
| (indices8[2] >> 0) & 0x3, |
| (indices8[2] >> 2) & 0x3, |
| (indices8[2] >> 4) & 0x3, |
| (indices8[2] >> 6) & 0x3, |
| (indices8[3] >> 0) & 0x3, |
| (indices8[3] >> 2) & 0x3, |
| (indices8[3] >> 4) & 0x3, |
| (indices8[3] >> 6) & 0x3 |
| }; |
| |
| const deInt32 alphas[16] = |
| { |
| extend4To8(((alphas8[0] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[0] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[1] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[1] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[2] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[2] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[3] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[3] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[4] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[4] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[5] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[5] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[6] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[6] >> 4) & 0xf)) << 24, |
| extend4To8(((alphas8[7] >> 0) & 0xf)) << 24, |
| extend4To8(((alphas8[7] >> 4) & 0xf)) << 24 |
| }; |
| |
| const deUint32 colors[4] = |
| { |
| color0, |
| color1, |
| interpolateColor(color1, color0), |
| interpolateColor(color0, color1) |
| }; |
| |
| for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) |
| { |
| for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) |
| { |
| deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); |
| *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[y * BC_BLOCK_WIDTH + x]; |
| } |
| } |
| } |
| |
| void decompressBc3 (const PixelBufferAccess& dst, const deUint8* src) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 4; |
| const deUint8 alpha0 = src[0]; |
| const deUint8 alpha1 = src[1]; |
| const deUint16 color0_16 = ((deUint16*)src)[4]; |
| const deUint16 color1_16 = ((deUint16*)src)[5]; |
| const deUint32 color0 = bgr16torgba32(color0_16); |
| const deUint32 color1 = bgr16torgba32(color1_16); |
| const deUint8* const indices8 = &src[12]; |
| const deUint64 alphaBits = get64BitBlockLE(src, 0) >> 16; |
| deUint32 alphas[8]; |
| |
| const deInt32 indices[16] = |
| { |
| (indices8[0] >> 0) & 0x3, |
| (indices8[0] >> 2) & 0x3, |
| (indices8[0] >> 4) & 0x3, |
| (indices8[0] >> 6) & 0x3, |
| (indices8[1] >> 0) & 0x3, |
| (indices8[1] >> 2) & 0x3, |
| (indices8[1] >> 4) & 0x3, |
| (indices8[1] >> 6) & 0x3, |
| (indices8[2] >> 0) & 0x3, |
| (indices8[2] >> 2) & 0x3, |
| (indices8[2] >> 4) & 0x3, |
| (indices8[2] >> 6) & 0x3, |
| (indices8[3] >> 0) & 0x3, |
| (indices8[3] >> 2) & 0x3, |
| (indices8[3] >> 4) & 0x3, |
| (indices8[3] >> 6) & 0x3 |
| }; |
| |
| const deInt32 alphaIndices[16] = |
| { |
| (deInt32)((alphaBits >> 0) & 0x7), |
| (deInt32)((alphaBits >> 3) & 0x7), |
| (deInt32)((alphaBits >> 6) & 0x7), |
| (deInt32)((alphaBits >> 9) & 0x7), |
| (deInt32)((alphaBits >> 12) & 0x7), |
| (deInt32)((alphaBits >> 15) & 0x7), |
| (deInt32)((alphaBits >> 18) & 0x7), |
| (deInt32)((alphaBits >> 21) & 0x7), |
| (deInt32)((alphaBits >> 24) & 0x7), |
| (deInt32)((alphaBits >> 27) & 0x7), |
| (deInt32)((alphaBits >> 30) & 0x7), |
| (deInt32)((alphaBits >> 33) & 0x7), |
| (deInt32)((alphaBits >> 36) & 0x7), |
| (deInt32)((alphaBits >> 39) & 0x7), |
| (deInt32)((alphaBits >> 42) & 0x7), |
| (deInt32)((alphaBits >> 45) & 0x7) |
| }; |
| |
| const deUint32 colors[4] = |
| { |
| color0, |
| color1, |
| interpolateColor(color1, color0), |
| interpolateColor(color0, color1) |
| }; |
| |
| alphas[0] = alpha0 << 24; |
| alphas[1] = alpha1 << 24; |
| |
| if (alpha0 > alpha1) |
| { |
| for (deUint32 i = 0; i < 6; i++) |
| alphas[i + 2] = (((deUint32)alpha0 * (6 - i) + (deUint32)alpha1 * (1 + i)) / 7) << 24; |
| } |
| else |
| { |
| for (deUint32 i = 0; i < 4; i++) |
| alphas[i + 2] = (((deUint32)alpha0 * (4 - i) + (deUint32)alpha1 * (1 + i)) / 5) << 24; |
| alphas[6] = 0; |
| alphas[7] = 0xff000000; |
| } |
| |
| for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) |
| { |
| for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) |
| { |
| deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize); |
| *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[alphaIndices[y * BC_BLOCK_WIDTH + x]]; |
| } |
| } |
| } |
| |
| void decompressBc4 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 4; |
| const deUint8 red0 = src[0]; |
| const deUint8 red1 = src[1]; |
| const deInt8 red0s = ((deInt8*)src)[0]; |
| const deInt8 red1s = ((deInt8*)src)[1]; |
| const deUint64 indexBits = get64BitBlockLE(src, 0) >> 16; |
| float reds[8]; |
| |
| const deInt32 indices[16] = |
| { |
| (deInt32)((indexBits >> 0) & 0x7), |
| (deInt32)((indexBits >> 3) & 0x7), |
| (deInt32)((indexBits >> 6) & 0x7), |
| (deInt32)((indexBits >> 9) & 0x7), |
| (deInt32)((indexBits >> 12) & 0x7), |
| (deInt32)((indexBits >> 15) & 0x7), |
| (deInt32)((indexBits >> 18) & 0x7), |
| (deInt32)((indexBits >> 21) & 0x7), |
| (deInt32)((indexBits >> 24) & 0x7), |
| (deInt32)((indexBits >> 27) & 0x7), |
| (deInt32)((indexBits >> 30) & 0x7), |
| (deInt32)((indexBits >> 33) & 0x7), |
| (deInt32)((indexBits >> 36) & 0x7), |
| (deInt32)((indexBits >> 39) & 0x7), |
| (deInt32)((indexBits >> 42) & 0x7), |
| (deInt32)((indexBits >> 45) & 0x7) |
| }; |
| |
| reds[0] = hasSign ? int8ToFloat(red0s) : uint8ToFloat(red0); |
| reds[1] = hasSign ? int8ToFloat(red1s) : uint8ToFloat(red1); |
| |
| if (reds[0] > reds[1]) |
| { |
| for (deUint32 i = 0; i < 6; i++) |
| reds[i + 2] = (reds[0] * (6.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 7.0f; |
| } |
| else |
| { |
| for (deUint32 i = 0; i < 4; i++) |
| reds[i + 2] = (reds[0] * (4.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 5.0f; |
| reds[6] = hasSign ? -1.0f : 0.0f; |
| reds[7] = 1.0f; |
| } |
| |
| for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) |
| { |
| for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) |
| { |
| float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize); |
| *dstPixel = reds[indices[y * BC_BLOCK_WIDTH + x]]; |
| } |
| } |
| } |
| |
| void decompressBc5 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 8; |
| float rg[2][8]; |
| deUint32 indices[2][16]; |
| |
| for (deUint32 c = 0; c < 2; c++) |
| { |
| const deUint32 offset = c * 8; |
| const deUint8 rg0 = src[offset]; |
| const deUint8 rg1 = src[offset + 1]; |
| const deInt8 rg0s = ((deInt8*)src)[offset]; |
| const deInt8 rg1s = ((deInt8*)src)[offset + 1]; |
| const deUint64 indexBits = get64BitBlockLE(src, c) >> 16; |
| |
| for (deUint32 i = 0; i < 16; i++) |
| indices[c][i] = (indexBits >> (i * 3)) & 0x7; |
| |
| rg[c][0] = hasSign ? int8ToFloat(rg0s) : uint8ToFloat(rg0); |
| rg[c][1] = hasSign ? int8ToFloat(rg1s) : uint8ToFloat(rg1); |
| |
| if (rg[c][0] > rg[c][1]) |
| { |
| for (deUint32 i = 0; i < 6; i++) |
| rg[c][i + 2] = (rg[c][0] * (6.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 7.0f; |
| } |
| else |
| { |
| for (deUint32 i = 0; i < 4; i++) |
| rg[c][i + 2] = (rg[c][0] * (4.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 5.0f; |
| rg[c][6] = hasSign ? -1.0f : 0.0f; |
| rg[c][7] = 1.0f; |
| } |
| } |
| |
| for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++) |
| { |
| for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++) |
| { |
| float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize); |
| for (deUint32 i = 0; i < 2; i++) |
| dstPixel[i] = rg[i][indices[i][y * BC_BLOCK_WIDTH + x]]; |
| } |
| } |
| } |
| |
| void decompressBc6H (const PixelBufferAccess& dst, const deUint8* src, bool hasSign) |
| { |
| using namespace BcDecompressInternal; |
| |
| deUint8* const dstPtr = (deUint8*)dst.getDataPtr(); |
| const deUint32 dstRowPitch = dst.getRowPitch(); |
| const deUint32 dstPixelSize = 6; |
| |
| deInt32 mode = extractModeBc6(src[0]); |
| IVec4 r (0); |
| IVec4 g (0); |
| IVec4 b (0); |
| deUint32 deltaBitsR = 0; |
| deUint32 deltaBitsG = 0; |
| deUint32 deltaBitsB = 0; |
| const deUint64 low = ((deUint64*)src)[0]; |
| const deUint64 high = ((deUint64*)src)[1]; |
| const deUint32 d = mode < 10 ? getBits128(low, high, 77, 81) : 0; |
| const deUint32 numRegions = mode > 9 ? 1 : 2; |
| const deUint32 numEndpoints = numRegions * 2; |
| const bool transformed = mode != 9 && mode != 10; |
| const deUint32 colorIndexBC = mode < 10 ? 3 : 4; |
| deUint64 colorIndexData = high >> (mode < 10 ? 18 : 1); |
| const deUint32 anchorIndex[2] = { 0, anchorIndicesSecondSubset2[d] }; |
| |
| switch (mode) |
| { |
| case 0: |
| g[2] |= getBits128(low, high, 2, 2) << 4; |
| b[2] |= getBits128(low, high, 3, 3) << 4; |
| b[3] |= getBits128(low, high, 4, 4) << 4; |
| r[0] |= getBits128(low, high, 5, 14); |
| g[0] |= getBits128(low, high, 15, 24); |
| b[0] |= getBits128(low, high, 25, 34); |
| r[1] |= getBits128(low, high, 35, 39); |
| g[3] |= getBits128(low, high, 40, 40) << 4; |
| g[2] |= getBits128(low, high, 41, 44); |
| g[1] |= getBits128(low, high, 45, 49); |
| b[3] |= getBits128(low, high, 50, 50); |
| g[3] |= getBits128(low, high, 51, 54); |
| b[1] |= getBits128(low, high, 55, 59); |
| b[3] |= getBits128(low, high, 60, 60) << 1; |
| b[2] |= getBits128(low, high, 61, 64); |
| r[2] |= getBits128(low, high, 65, 69); |
| b[3] |= getBits128(low, high, 70, 70) << 2; |
| r[3] |= getBits128(low, high, 71, 75); |
| b[3] |= getBits128(low, high, 76, 76) << 3; |
| deltaBitsR = deltaBitsG = deltaBitsB = 5; |
| break; |
| |
| case 1: |
| g[2] |= getBits128(low, high, 2, 2) << 5; |
| g[3] |= getBits128(low, high, 3, 3) << 4; |
| g[3] |= getBits128(low, high, 4, 4) << 5; |
| r[0] |= getBits128(low, high, 5, 11); |
| b[3] |= getBits128(low, high, 12, 12); |
| b[3] |= getBits128(low, high, 13, 13) << 1; |
| b[2] |= getBits128(low, high, 14, 14) << 4; |
| g[0] |= getBits128(low, high, 15, 21); |
| b[2] |= getBits128(low, high, 22, 22) << 5; |
| b[3] |= getBits128(low, high, 23, 23) << 2; |
| g[2] |= getBits128(low, high, 24, 24) << 4; |
| b[0] |= getBits128(low, high, 25, 31); |
| b[3] |= getBits128(low, high, 32, 32) << 3; |
| b[3] |= getBits128(low, high, 33, 33) << 5; |
| b[3] |= getBits128(low, high, 34, 34) << 4; |
| r[1] |= getBits128(low, high, 35, 40); |
| g[2] |= getBits128(low, high, 41, 44); |
| g[1] |= getBits128(low, high, 45, 50); |
| g[3] |= getBits128(low, high, 51, 54); |
| b[1] |= getBits128(low, high, 55, 60); |
| b[2] |= getBits128(low, high, 61, 64); |
| r[2] |= getBits128(low, high, 65, 70); |
| r[3] |= getBits128(low, high, 71, 76); |
| deltaBitsR = deltaBitsG = deltaBitsB = 6; |
| break; |
| |
| case 2: |
| r[0] |= getBits128(low, high, 5, 14); |
| g[0] |= getBits128(low, high, 15, 24); |
| b[0] |= getBits128(low, high, 25, 34); |
| r[1] |= getBits128(low, high, 35, 39); |
| r[0] |= getBits128(low, high, 40, 40) << 10; |
| g[2] |= getBits128(low, high, 41, 44); |
| g[1] |= getBits128(low, high, 45, 48); |
| g[0] |= getBits128(low, high, 49, 49) << 10; |
| b[3] |= getBits128(low, high, 50, 50); |
| g[3] |= getBits128(low, high, 51, 54); |
| b[1] |= getBits128(low, high, 55, 58); |
| b[0] |= getBits128(low, high, 59, 59) << 10; |
| b[3] |= getBits128(low, high, 60, 60) << 1; |
| b[2] |= getBits128(low, high, 61, 64); |
| r[2] |= getBits128(low, high, 65, 69); |
| b[3] |= getBits128(low, high, 70, 70) << 2; |
| r[3] |= getBits128(low, high, 71, 75); |
| b[3] |= getBits128(low, high, 76, 76) << 3; |
| deltaBitsR = 5; |
| deltaBitsG = deltaBitsB = 4; |
| break; |
| |
| case 3: |
| r[0] |= getBits128(low, high, 5, 14); |
| g[0] |= getBits128(low, high, 15, 24); |
| b[0] |= getBits128(low, high, 25, 34); |
| r[1] |= getBits128(low, high, 35, 38); |
| r[0] |= getBits128(low, high, 39, 39) << 10; |
| g[3] |= getBits128(low, high, 40, 40) << 4; |
| g[2] |= getBits128(low, high, 41, 44); |
| g[1] |= getBits128(low, high, 45, 49); |
| g[0] |= getBits128(low, high, 50, 50) << 10; |
| g[3] |= getBits128(low, high, 51, 54); |
| b[1] |= getBits128(low, high, 55, 58); |
| b[0] |= getBits128(low, high, 59, 59) << 10; |
| b[3] |= getBits128(low, high, 60, 60) << 1; |
| b[2] |= getBits128(low, high, 61, 64); |
| r[2] |= getBits128(low, high, 65, 68); |
| b[3] |= getBits128(low, high, 69, 69); |
| b[3] |= getBits128(low, high, 70, 70) << 2; |
| r[3] |= getBits128(low, high, 71, 74); |
| g[2] |= getBits128(low, high, 75, 75) << 4; |
| b[3] |= getBits128(low, high, 76, 76) << 3; |
| deltaBitsR = deltaBitsB = 4; |
| deltaBitsG = 5; |
| break; |
| |
| case 4: |
| r[0] |= getBits128(low, high, 5, 14); |
| g[0] |= getBits128(low, high, 15, 24); |
| b[0] |= getBits128(low, high, 25, 34); |
| r[1] |= getBits128(low, high, 35, 38); |
| r[0] |= getBits128(low, high, 39, 39) << 10; |
| b[2] |= getBits128(low, high, 40, 40) << 4; |
| g[2] |= getBits128(low, high, 41, 44); |
| g[1] |= getBits128(low, high, 45, 48); |
| g[0] |= getBits128(low, high, 49, 49) << 10; |
| b[3] |= getBits128(low, high, 50, 50); |
| g[3] |= getBits128(low, high, 51, 54); |
| b[1] |= getBits128(low, high, 55, 59); |
| b[0] |= getBits128(low, high, 60, 60) << 10; |
| b[2] |= getBits128(low, high, 61, 64); |
| r[2] |= getBits128(low, high, 65, 68); |
| b[3] |= getBits128(low, high, 69, 69) << 1; |
| b[3] |= getBits128(low, high, 70, 70) << 2; |
| r[3] |= getBits128(low, high, 71, 74);
|