return -1;
}
}
+ else if (isBcFormat(format))
+ {
+ switch (format)
+ {
+ case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: return 8;
+ case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: return 16;
+ case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: return 16;
+
+ default:
+ DE_ASSERT(false);
+ return -1;
+ }
+ }
else
{
DE_ASSERT(false);
return IVec3();
}
}
+ else if (isBcFormat(format))
+ {
+ return IVec3(4, 4, 1);
+ }
else
{
DE_ASSERT(false);
}
}
+bool isBcFormat (CompressedTexFormat format)
+{
+ switch (format)
+ {
+ case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK:
+ return true;
+
+ default:
+ return false;
+ }
+}
+
+bool isBcBitExactFormat (CompressedTexFormat format)
+{
+ switch (format)
+ {
+ case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK:
+ return true;
+
+ default:
+ return false;
+ }
+}
+
+bool isBcSRGBFormat (CompressedTexFormat format)
+{
+ switch (format)
+ {
+ case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK:
+ case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK:
+ return true;
+
+ default:
+ return false;
+ }
+}
+
bool isAstcFormat (CompressedTexFormat format)
{
switch (format)
else
return TextureFormat(TextureFormat::RGBA, TextureFormat::HALF_FLOAT);
}
+ else if (isBcFormat(format))
+ {
+ if (format == COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK)
+ return TextureFormat(TextureFormat::R, TextureFormat::FLOAT);
+ else if (format == COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK || format == COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK)
+ return TextureFormat(TextureFormat::RG, TextureFormat::FLOAT);
+ else if (format == COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK || format == COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK)
+ return TextureFormat(TextureFormat::RGB, TextureFormat::HALF_FLOAT);
+ else if (isBcSRGBFormat(format))
+ return TextureFormat(TextureFormat::sRGBA, TextureFormat::UNORM_INT8);
+ else
+ return TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8);
+ }
else
{
DE_ASSERT(false);
namespace
{
+inline deUint8 extend4To8 (deUint8 src)
+{
+ DE_ASSERT((src & ~((1<<4)-1)) == 0);
+ return (deUint8)((src << 4) | src);
+}
+
+inline deUint8 extend5To8 (deUint8 src)
+{
+ DE_ASSERT((src & ~((1<<5)-1)) == 0);
+ return (deUint8)((src << 3) | (src >> 2));
+}
+
+inline deUint8 extend6To8 (deUint8 src)
+{
+ DE_ASSERT((src & ~((1<<6)-1)) == 0);
+ return (deUint8)((src << 2) | (src >> 4));
+}
+
// \todo [2013-08-06 nuutti] ETC and ASTC decompression codes are rather unrelated, and are already in their own "private" namespaces - should this be split to multiple files?
namespace EtcDecompressInternal
return (deUint32)((src >> low) & 0xFFFFFFFFu);
}
-inline deUint8 extend4To8 (deUint8 src)
-{
- DE_ASSERT((src & ~((1<<4)-1)) == 0);
- return (deUint8)((src << 4) | src);
-}
-
-inline deUint8 extend5To8 (deUint8 src)
-{
- DE_ASSERT((src & ~((1<<5)-1)) == 0);
- return (deUint8)((src << 3) | (src >> 2));
-}
-
-inline deUint8 extend6To8 (deUint8 src)
-{
- DE_ASSERT((src & ~((1<<6)-1)) == 0);
- return (deUint8)((src << 2) | (src >> 4));
-}
-
inline deUint8 extend7To8 (deUint8 src)
{
DE_ASSERT((src & ~((1<<7)-1)) == 0);
}
}
+namespace BcDecompressInternal
+{
+
+enum
+{
+ BC_BLOCK_WIDTH = 4,
+ BC_BLOCK_HEIGHT = 4
+};
+
+static const deUint8 epBits[14] = { 10, 7, 11, 11, 11, 9, 8, 8, 8, 6, 10, 11, 12, 16 };
+
+static const deUint8 partitions2[64][16] =
+{
+ { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 },
+ { 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1 },
+ { 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1 },
+ { 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1 },
+ { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1 },
+ { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1 },
+ { 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0 },
+ { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0 },
+ { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0 },
+ { 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 },
+ { 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1 },
+ { 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0 },
+ { 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0 },
+ { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0 },
+ { 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0 },
+ { 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 },
+ { 0, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0 },
+ { 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0 },
+ { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1 },
+ { 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0 },
+ { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0 },
+ { 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0 },
+ { 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0 },
+ { 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1 },
+ { 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1 },
+ { 0, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0 },
+ { 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0 },
+ { 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0 },
+ { 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0 },
+ { 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0 },
+ { 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1 },
+ { 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1 },
+ { 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0 },
+ { 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0 },
+ { 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0 },
+ { 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0 },
+ { 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0 },
+ { 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1 },
+ { 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0 },
+ { 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 0 },
+ { 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1 },
+ { 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1 },
+ { 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1 },
+ { 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0 },
+ { 0, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0 },
+ { 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 1, 1 }
+};
+
+static const deUint8 partitions3[64][16] =
+{
+ { 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 1, 2, 2, 2, 2 },
+ { 0, 0, 0, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 2, 1 },
+ { 0, 0, 0, 0, 2, 0, 0, 1, 2, 2, 1, 1, 2, 2, 1, 1 },
+ { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 1, 0, 1, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2 },
+ { 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 2, 2 },
+ { 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1 },
+ { 0, 0, 1, 1, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2 },
+ { 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2 },
+ { 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2, 0, 1, 1, 2 },
+ { 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2, 0, 1, 2, 2 },
+ { 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2, 1, 2, 2, 2 },
+ { 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0, 2, 2, 2, 0 },
+ { 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 1, 2, 1, 1, 2, 2 },
+ { 0, 1, 1, 1, 0, 0, 1, 1, 2, 0, 0, 1, 2, 2, 0, 0 },
+ { 0, 0, 0, 0, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2 },
+ { 0, 0, 2, 2, 0, 0, 2, 2, 0, 0, 2, 2, 1, 1, 1, 1 },
+ { 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2, 0, 2, 2, 2 },
+ { 0, 0, 0, 1, 0, 0, 0, 1, 2, 2, 2, 1, 2, 2, 2, 1 },
+ { 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2 },
+ { 0, 0, 0, 0, 1, 1, 0, 0, 2, 2, 1, 0, 2, 2, 1, 0 },
+ { 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1, 0, 0, 0, 0 },
+ { 0, 0, 1, 2, 0, 0, 1, 2, 1, 1, 2, 2, 2, 2, 2, 2 },
+ { 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1, 0, 1, 1, 0 },
+ { 0, 0, 0, 0, 0, 1, 1, 0, 1, 2, 2, 1, 1, 2, 2, 1 },
+ { 0, 0, 2, 2, 1, 1, 0, 2, 1, 1, 0, 2, 0, 0, 2, 2 },
+ { 0, 1, 1, 0, 0, 1, 1, 0, 2, 0, 0, 2, 2, 2, 2, 2 },
+ { 0, 0, 1, 1, 0, 1, 2, 2, 0, 1, 2, 2, 0, 0, 1, 1 },
+ { 0, 0, 0, 0, 2, 0, 0, 0, 2, 2, 1, 1, 2, 2, 2, 1 },
+ { 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 2, 2, 2 },
+ { 0, 2, 2, 2, 0, 0, 2, 2, 0, 0, 1, 2, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 0, 0, 1, 2, 0, 0, 2, 2, 0, 2, 2, 2 },
+ { 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0, 0, 1, 2, 0 },
+ { 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0 },
+ { 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0, 1, 2, 0 },
+ { 0, 1, 2, 0, 2, 0, 1, 2, 1, 2, 0, 1, 0, 1, 2, 0 },
+ { 0, 0, 1, 1, 2, 2, 0, 0, 1, 1, 2, 2, 0, 0, 1, 1 },
+ { 0, 0, 1, 1, 1, 1, 2, 2, 2, 2, 0, 0, 0, 0, 1, 1 },
+ { 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1 },
+ { 0, 0, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2, 1, 1, 2, 2 },
+ { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 2, 2, 0, 0, 1, 1 },
+ { 0, 2, 2, 0, 1, 2, 2, 1, 0, 2, 2, 0, 1, 2, 2, 1 },
+ { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 0, 1, 0, 1 },
+ { 0, 0, 0, 0, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1 },
+ { 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 2, 2, 2, 2 },
+ { 0, 2, 2, 2, 0, 1, 1, 1, 0, 2, 2, 2, 0, 1, 1, 1 },
+ { 0, 0, 0, 2, 1, 1, 1, 2, 0, 0, 0, 2, 1, 1, 1, 2 },
+ { 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2, 2, 1, 1, 2 },
+ { 0, 2, 2, 2, 0, 1, 1, 1, 0, 1, 1, 1, 0, 2, 2, 2 },
+ { 0, 0, 0, 2, 1, 1, 1, 2, 1, 1, 1, 2, 0, 0, 0, 2 },
+ { 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2, 2, 1, 1, 2 },
+ { 0, 1, 1, 0, 0, 1, 1, 0, 2, 2, 2, 2, 2, 2, 2, 2 },
+ { 0, 0, 2, 2, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 2, 2 },
+ { 0, 0, 2, 2, 1, 1, 2, 2, 1, 1, 2, 2, 0, 0, 2, 2 },
+ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 1, 1, 2 },
+ { 0, 0, 0, 2, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 1 },
+ { 0, 2, 2, 2, 1, 2, 2, 2, 0, 2, 2, 2, 1, 2, 2, 2 },
+ { 0, 1, 0, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2 },
+ { 0, 1, 1, 1, 2, 0, 1, 1, 2, 2, 0, 1, 2, 2, 2, 0 }
+};
+
+static const deUint8 anchorIndicesSecondSubset2[64] = { 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 2, 8, 2, 2, 8, 8, 15, 2, 8, 2, 2, 8, 8, 2, 2,
+ 15, 15, 6, 8, 2, 8, 15, 15, 2, 8, 2, 2, 2, 15, 15, 6, 6, 2, 6, 8, 15, 15, 2, 2, 15, 15, 15, 15, 15, 2, 2, 15 };
+
+static const deUint8 anchorIndicesSecondSubset3[64] = { 3, 3, 15, 15, 8, 3, 15, 15, 8, 8, 6, 6, 6, 5, 3, 3, 3, 3, 8, 15, 3, 3, 6, 10, 5, 8, 8, 6, 8, 5, 15, 15,
+ 8, 15, 3, 5, 6, 10, 8, 15, 15, 3, 15, 5, 15, 15, 15, 15, 3, 15, 5, 5, 5, 8, 5, 10, 5, 10, 8, 13, 15, 12, 3, 3 };
+
+static const deUint8 anchorIndicesThirdSubset[64] = { 15, 8, 8, 3, 15, 15, 3, 8, 15, 15, 15, 15, 15, 15, 15, 8, 15, 8, 15, 3, 15, 8, 15, 8, 3, 15, 6, 10, 15, 15, 10, 8,
+ 15, 3, 15, 10, 10, 8, 9, 10, 6, 15, 8, 15, 3, 6, 6, 8, 15, 3, 15, 15, 15, 15, 15, 15, 15, 15, 15, 15, 3, 15, 15, 8 };
+
+static const deUint16 weights2[4] = { 0, 21, 43, 64 };
+static const deUint16 weights3[8] = { 0, 9, 18, 27, 37, 46, 55, 64 };
+static const deUint16 weights4[16] = { 0, 4, 9, 13, 17, 21, 26, 30, 34, 38, 43, 47, 51, 55, 60, 64 };
+
+inline float uint8ToFloat (deUint8 src)
+{
+ return ((float)src / 255.0f);
+}
+
+inline float int8ToFloat (deInt8 src)
+{
+ return ((float)src / 128.0f);
+}
+
+inline deUint32 bgr16torgba32 (deUint16 src)
+{
+ const deUint32 src32 = src;
+ const deUint8 b5 = (src32 & 0x1f);
+ const deUint8 g6 = (src32 >> 5) & 0x3f;
+ const deUint8 r5 = (src32 >> 11) & 0x1f;
+ const deUint32 a8 = 0xff;
+ const deUint32 b8 = extend5To8(b5);
+ const deUint32 g8 = extend6To8(g6);
+ const deUint32 r8 = extend5To8(r5);
+
+ return (r8 | (g8 <<8) | (b8 << 16) | (a8 << 24));
+}
+
+// Interpolates color = 1/3 * c0 + 2/3 * c1
+inline deUint32 interpolateColor (deUint32 c0, deUint32 c1)
+{
+ const deUint32 r0 = c0 & 0xff;
+ const deUint32 g0 = (c0 >> 8) & 0xff;
+ const deUint32 b0 = (c0 >> 16) & 0xff;
+ const deUint32 a0 = (c0 >> 24) & 0xff;
+
+ const deUint32 r1 = c1 & 0xff;
+ const deUint32 g1 = (c1 >> 8) & 0xff;
+ const deUint32 b1 = (c1 >> 16) & 0xff;
+ const deUint32 a1 = (c1 >> 24) & 0xff;
+
+ const deUint32 r = (r0 + (r1 << 1)) / 3;
+ const deUint32 g = (g0 + (g1 << 1)) / 3;
+ const deUint32 b = (b0 + (b1 << 1)) / 3;
+ const deUint32 a = (a0 + (a1 << 1)) / 3;
+
+ return (r | (g << 8) | (b << 16) | (a << 24));
+}
+
+// Average of two colors
+inline deUint32 averageColor (deUint32 c0, deUint32 c1)
+{
+ const deUint32 r0 = c0 & 0xff;
+ const deUint32 g0 = (c0 >> 8) & 0xff;
+ const deUint32 b0 = (c0 >> 16) & 0xff;
+ const deUint32 a0 = (c0 >> 24) & 0xff;
+
+ const deUint32 r1 = c1 & 0xff;
+ const deUint32 g1 = (c1 >> 8) & 0xff;
+ const deUint32 b1 = (c1 >> 16) & 0xff;
+ const deUint32 a1 = (c1 >> 24) & 0xff;
+
+ const deUint32 r = (r0 + r1) >> 1;
+ const deUint32 g = (g0 + g1) >> 1;
+ const deUint32 b = (b0 + b1) >> 1;
+ const deUint32 a = (a0 + a1) >> 1;
+
+ return (r | (g << 8) | (b << 16) | (a << 24));
+}
+
+inline deInt8 extractModeBc6 (deUint8 src)
+{
+ // Catch illegal modes
+ switch(src & 0x1f)
+ {
+ case 0x13:
+ case 0x17:
+ case 0x1b:
+ case 0x1f:
+ return -1;
+ };
+
+ switch (src & 0x3)
+ {
+ case 0: return 0;
+ case 1: return 1;
+ case 2: return (deInt8)(2 + ((src >> 2) & 0x7));
+ case 3: return (deInt8)(10 + ((src >> 2) & 0x7));
+ };
+
+ return -1;
+}
+
+inline deInt8 extractModeBc7 (deUint8 src)
+{
+ for (deInt8 i = 0; i < 8; i++)
+ if (src & (1 << i))
+ return i;
+
+ return -1;
+}
+
+inline deUint32 getBits128 (deUint64 low, deUint64 high, deUint32 first, deUint32 last)
+{
+ const deUint64 d[2] = { low, high };
+ const bool reverse = first > last;
+ deUint32 ret = 0;
+
+ if (reverse)
+ {
+ const deUint32 tmp = first;
+ first = last;
+ last = tmp;
+ }
+
+ const int elementFirst = first / 64;
+ const int elementLast = last / 64;
+
+ if (elementFirst == elementLast)
+ {
+ // Bits contained in one of the 64bit elements
+ const deUint32 shift = first % 64;
+ const deUint32 len = last - first + 1;
+ const deUint32 mask = (1 << len) - 1;
+ ret = (deUint32)((d[elementFirst] >> shift) & mask);
+ }
+ else
+ {
+ // Bits contained in both of the 64bit elements
+ DE_ASSERT(last > 63);
+ DE_ASSERT(first < 64);
+ const deUint32 len0 = 64 - first;
+ const deUint32 mask0 = (1 << len0) - 1;
+ const deUint32 data0 = (deUint32)(low >> first) & mask0;
+ const deUint32 len1 = last - 63;
+ const deUint32 mask1 = (1 << len1) - 1;
+ const deUint32 data1 = (deUint32)(high & mask1);
+ ret = (deUint32)((data1 << len0) | data0);
+ }
+
+ if (reverse)
+ {
+ const deUint32 len = last - first + 1;
+ const deUint32 orig = ret;
+ ret = 0;
+
+ for (deUint32 i = 0; i < len; i++)
+ {
+ ret |= ((orig >> (len - 1 - i)) & 1) << i;
+ }
+ }
+
+ return ret;
+}
+
+inline deInt32 signExtend (deInt32 value, deInt32 srcBits, deInt32 dstBits)
+{
+ deUint32 sign = value & (1 << (srcBits - 1));
+
+ if (!sign) return value;
+
+ deInt32 dstMask = (deInt32)(((deUint64)1 << dstBits) - 1);
+ deInt32 extendedBits = 0xffffffff << srcBits;
+ return (value | extendedBits) & dstMask;
+}
+
+inline deInt32 unquantize (deInt32 x, int mode, bool hasSign)
+{
+ if (hasSign)
+ {
+ bool s = false;
+
+ if (epBits[mode] >= 16) return x;
+
+ if (x < 0)
+ {
+ s = true;
+ x = -x;
+ }
+
+ if (x == 0)
+ x = 0;
+ else if (x >= (((deInt32)1 << (epBits[mode] - 1)) - 1))
+ x = 0x7fff;
+ else
+ x = (((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1);
+
+ if (s)
+ x = -x;
+
+ return x;
+ }
+ else
+ {
+ if (epBits[mode] >= 15)
+ return x;
+ else if (x == 0)
+ return 0;
+ else if (x == (((deInt32)1 << epBits[mode]) - 1))
+ return 0xffff;
+ else
+ return ((((deInt32)x << 15) + 0x4000) >> (epBits[mode] - 1));
+ }
+}
+
+inline deInt32 interpolate (deInt32 a, deInt32 b, deUint32 index, deUint32 indexPrecision)
+{
+ const deUint16* weights[] = {weights2, weights3, weights4};
+ const deUint16* weight = weights[indexPrecision-2];
+ DE_ASSERT(indexPrecision >= 2 && indexPrecision <= 4);
+
+ return (((64 - weight[index]) * a + weight[index] * b + 32) >> 6);
+}
+
+inline deInt16 finishUnquantize (deInt32 x, bool hasSign)
+{
+ if (hasSign)
+ {
+ if (x < 0)
+ x = -(((-x) * 31) >> 5);
+ else
+ x = (x * 31) >> 5;
+
+ if (x < 0)
+ x = (-x) | 0x8000;
+ }
+ else
+ {
+ x = (x * 31) / 64;
+ }
+
+ return (deInt16)x;
+}
+
+} // BcDecompressInternal
+
+void decompressBc1 (const PixelBufferAccess& dst, const deUint8* src, bool hasAlpha)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 4;
+ const deUint16 color0_16 = ((deUint16*)src)[0];
+ const deUint16 color1_16 = ((deUint16*)src)[1];
+ const deUint32 color0 = bgr16torgba32(color0_16);
+ const deUint32 color1 = bgr16torgba32(color1_16);
+ const deUint8* const indices8 = &src[4];
+
+ const bool alphaMode = color1_16 > color0_16;
+
+ const deInt32 indices[16] =
+ {
+ (indices8[0] >> 0) & 0x3,
+ (indices8[0] >> 2) & 0x3,
+ (indices8[0] >> 4) & 0x3,
+ (indices8[0] >> 6) & 0x3,
+ (indices8[1] >> 0) & 0x3,
+ (indices8[1] >> 2) & 0x3,
+ (indices8[1] >> 4) & 0x3,
+ (indices8[1] >> 6) & 0x3,
+ (indices8[2] >> 0) & 0x3,
+ (indices8[2] >> 2) & 0x3,
+ (indices8[2] >> 4) & 0x3,
+ (indices8[2] >> 6) & 0x3,
+ (indices8[3] >> 0) & 0x3,
+ (indices8[3] >> 2) & 0x3,
+ (indices8[3] >> 4) & 0x3,
+ (indices8[3] >> 6) & 0x3
+ };
+
+ const deUint32 colors[4] =
+ {
+ color0,
+ color1,
+ alphaMode ? averageColor(color0, color1) : interpolateColor(color1, color0),
+ alphaMode ? (hasAlpha ? 0 : 0xff000000) : interpolateColor(color0, color1)
+ };
+
+ for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++)
+ {
+ for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++)
+ {
+ deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ *dstPixel = colors[indices[y * BC_BLOCK_WIDTH + x]];
+ }
+ }
+}
+
+void decompressBc2 (const PixelBufferAccess& dst, const deUint8* src)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 4;
+ const deUint16 color0_16 = ((deUint16*)src)[4];
+ const deUint16 color1_16 = ((deUint16*)src)[5];
+ const deUint32 color0 = bgr16torgba32(color0_16);
+ const deUint32 color1 = bgr16torgba32(color1_16);
+ const deUint8* const indices8 = &src[12];
+ const deUint8* const alphas8 = src;
+
+ const deInt32 indices[16] =
+ {
+ (indices8[0] >> 0) & 0x3,
+ (indices8[0] >> 2) & 0x3,
+ (indices8[0] >> 4) & 0x3,
+ (indices8[0] >> 6) & 0x3,
+ (indices8[1] >> 0) & 0x3,
+ (indices8[1] >> 2) & 0x3,
+ (indices8[1] >> 4) & 0x3,
+ (indices8[1] >> 6) & 0x3,
+ (indices8[2] >> 0) & 0x3,
+ (indices8[2] >> 2) & 0x3,
+ (indices8[2] >> 4) & 0x3,
+ (indices8[2] >> 6) & 0x3,
+ (indices8[3] >> 0) & 0x3,
+ (indices8[3] >> 2) & 0x3,
+ (indices8[3] >> 4) & 0x3,
+ (indices8[3] >> 6) & 0x3
+ };
+
+ const deInt32 alphas[16] =
+ {
+ extend4To8(((alphas8[0] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[0] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[1] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[1] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[2] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[2] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[3] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[3] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[4] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[4] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[5] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[5] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[6] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[6] >> 4) & 0xf)) << 24,
+ extend4To8(((alphas8[7] >> 0) & 0xf)) << 24,
+ extend4To8(((alphas8[7] >> 4) & 0xf)) << 24
+ };
+
+ const deUint32 colors[4] =
+ {
+ color0,
+ color1,
+ interpolateColor(color1, color0),
+ interpolateColor(color0, color1)
+ };
+
+ for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++)
+ {
+ for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++)
+ {
+ deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[y * BC_BLOCK_WIDTH + x];
+ }
+ }
+}
+
+void decompressBc3 (const PixelBufferAccess& dst, const deUint8* src)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 4;
+ const deUint8 alpha0 = src[0];
+ const deUint8 alpha1 = src[1];
+ const deUint16 color0_16 = ((deUint16*)src)[4];
+ const deUint16 color1_16 = ((deUint16*)src)[5];
+ const deUint32 color0 = bgr16torgba32(color0_16);
+ const deUint32 color1 = bgr16torgba32(color1_16);
+ const deUint8* const indices8 = &src[12];
+ const deUint64 alphaBits = *((deUint64*)&src[2]);
+ deUint32 alphas[8];
+
+ const deInt32 indices[16] =
+ {
+ (indices8[0] >> 0) & 0x3,
+ (indices8[0] >> 2) & 0x3,
+ (indices8[0] >> 4) & 0x3,
+ (indices8[0] >> 6) & 0x3,
+ (indices8[1] >> 0) & 0x3,
+ (indices8[1] >> 2) & 0x3,
+ (indices8[1] >> 4) & 0x3,
+ (indices8[1] >> 6) & 0x3,
+ (indices8[2] >> 0) & 0x3,
+ (indices8[2] >> 2) & 0x3,
+ (indices8[2] >> 4) & 0x3,
+ (indices8[2] >> 6) & 0x3,
+ (indices8[3] >> 0) & 0x3,
+ (indices8[3] >> 2) & 0x3,
+ (indices8[3] >> 4) & 0x3,
+ (indices8[3] >> 6) & 0x3
+ };
+
+ const deInt32 alphaIndices[16] =
+ {
+ (deInt32)((alphaBits >> 0) & 0x7),
+ (deInt32)((alphaBits >> 3) & 0x7),
+ (deInt32)((alphaBits >> 6) & 0x7),
+ (deInt32)((alphaBits >> 9) & 0x7),
+ (deInt32)((alphaBits >> 12) & 0x7),
+ (deInt32)((alphaBits >> 15) & 0x7),
+ (deInt32)((alphaBits >> 18) & 0x7),
+ (deInt32)((alphaBits >> 21) & 0x7),
+ (deInt32)((alphaBits >> 24) & 0x7),
+ (deInt32)((alphaBits >> 27) & 0x7),
+ (deInt32)((alphaBits >> 30) & 0x7),
+ (deInt32)((alphaBits >> 33) & 0x7),
+ (deInt32)((alphaBits >> 36) & 0x7),
+ (deInt32)((alphaBits >> 39) & 0x7),
+ (deInt32)((alphaBits >> 42) & 0x7),
+ (deInt32)((alphaBits >> 45) & 0x7)
+ };
+
+ const deUint32 colors[4] =
+ {
+ color0,
+ color1,
+ interpolateColor(color1, color0),
+ interpolateColor(color0, color1)
+ };
+
+ alphas[0] = alpha0 << 24;
+ alphas[1] = alpha1 << 24;
+
+ if (alpha0 > alpha1)
+ {
+ for (deUint32 i = 0; i < 6; i++)
+ alphas[i + 2] = (((deUint32)alpha0 * (6 - i) + (deUint32)alpha1 * (1 + i)) / 7) << 24;
+ }
+ else
+ {
+ for (deUint32 i = 0; i < 4; i++)
+ alphas[i + 2] = (((deUint32)alpha0 * (4 - i) + (deUint32)alpha1 * (1 + i)) / 5) << 24;
+ alphas[6] = 0;
+ alphas[7] = 0xff000000;
+ }
+
+ for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++)
+ {
+ for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++)
+ {
+ deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ *dstPixel = (colors[indices[y * BC_BLOCK_WIDTH + x]] & 0x00ffffff) | alphas[alphaIndices[y * BC_BLOCK_WIDTH + x]];
+ }
+ }
+}
+
+void decompressBc4 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 4;
+ const deUint8 red0 = src[0];
+ const deUint8 red1 = src[1];
+ const deInt8 red0s = ((deInt8*)src)[0];
+ const deInt8 red1s = ((deInt8*)src)[1];
+ const deUint64 indexBits = *((deUint64*)&src[2]);
+ float reds[8];
+
+ const deInt32 indices[16] =
+ {
+ (deInt32)((indexBits >> 0) & 0x7),
+ (deInt32)((indexBits >> 3) & 0x7),
+ (deInt32)((indexBits >> 6) & 0x7),
+ (deInt32)((indexBits >> 9) & 0x7),
+ (deInt32)((indexBits >> 12) & 0x7),
+ (deInt32)((indexBits >> 15) & 0x7),
+ (deInt32)((indexBits >> 18) & 0x7),
+ (deInt32)((indexBits >> 21) & 0x7),
+ (deInt32)((indexBits >> 24) & 0x7),
+ (deInt32)((indexBits >> 27) & 0x7),
+ (deInt32)((indexBits >> 30) & 0x7),
+ (deInt32)((indexBits >> 33) & 0x7),
+ (deInt32)((indexBits >> 36) & 0x7),
+ (deInt32)((indexBits >> 39) & 0x7),
+ (deInt32)((indexBits >> 42) & 0x7),
+ (deInt32)((indexBits >> 45) & 0x7)
+ };
+
+ reds[0] = hasSign ? int8ToFloat(red0s) : uint8ToFloat(red0);
+ reds[1] = hasSign ? int8ToFloat(red1s) : uint8ToFloat(red1);
+
+ if (reds[0] > reds[1])
+ {
+ for (deUint32 i = 0; i < 6; i++)
+ reds[i + 2] = (reds[0] * (6.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 7.0f;
+ }
+ else
+ {
+ for (deUint32 i = 0; i < 4; i++)
+ reds[i + 2] = (reds[0] * (4.0f - (float)i) + reds[1] * (1.0f + (float)i)) / 5.0f;
+ reds[6] = hasSign ? -1.0f : 0.0f;
+ reds[7] = 1.0f;
+ }
+
+ for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++)
+ {
+ for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++)
+ {
+ float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ *dstPixel = reds[indices[y * BC_BLOCK_WIDTH + x]];
+ }
+ }
+}
+
+void decompressBc5 (const PixelBufferAccess& dst, const deUint8* src, bool hasSign)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 8;
+ float rg[2][8];
+ deUint32 indices[2][16];
+
+ for (deUint32 c = 0; c < 2; c++)
+ {
+ const deUint32 offset = c * 8;
+ const deUint8 rg0 = src[offset];
+ const deUint8 rg1 = src[offset + 1];
+ const deInt8 rg0s = ((deInt8*)src)[offset];
+ const deInt8 rg1s = ((deInt8*)src)[offset + 1];
+ const deUint64 indexBits = *((deUint64*)&src[offset + 2]);
+
+ for (deUint32 i = 0; i < 16; i++)
+ indices[c][i] = (indexBits >> (i * 3)) & 0x7;
+
+ rg[c][0] = hasSign ? int8ToFloat(rg0s) : uint8ToFloat(rg0);
+ rg[c][1] = hasSign ? int8ToFloat(rg1s) : uint8ToFloat(rg1);
+
+ if (rg[c][0] > rg[c][1])
+ {
+ for (deUint32 i = 0; i < 6; i++)
+ rg[c][i + 2] = (rg[c][0] * (6.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 7.0f;
+ }
+ else
+ {
+ for (deUint32 i = 0; i < 4; i++)
+ rg[c][i + 2] = (rg[c][0] * (4.0f - (float)i) + rg[c][1] * (1.0f + (float)i)) / 5.0f;
+ rg[c][6] = hasSign ? -1.0f : 0.0f;
+ rg[c][7] = 1.0f;
+ }
+ }
+
+ for (deUint32 y = 0; y < (deUint32)BC_BLOCK_HEIGHT; y++)
+ {
+ for (deUint32 x = 0; x < (deUint32)BC_BLOCK_WIDTH; x++)
+ {
+ float* const dstPixel = (float*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ for (deUint32 i = 0; i < 2; i++)
+ dstPixel[i] = rg[i][indices[i][y * BC_BLOCK_WIDTH + x]];
+ }
+ }
+}
+
+void decompressBc6H (const PixelBufferAccess& dst, const deUint8* src, bool hasSign)
+{
+ using namespace BcDecompressInternal;
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 6;
+
+ deInt32 mode = extractModeBc6(src[0]);
+ IVec4 r (0);
+ IVec4 g (0);
+ IVec4 b (0);
+ deUint32 deltaBitsR = 0;
+ deUint32 deltaBitsG = 0;
+ deUint32 deltaBitsB = 0;
+ const deUint64 low = ((deUint64*)src)[0];
+ const deUint64 high = ((deUint64*)src)[1];
+ const deUint32 d = mode < 10 ? getBits128(low, high, 77, 81) : 0;
+ const deUint32 numRegions = mode > 9 ? 1 : 2;
+ const deUint32 numEndpoints = numRegions * 2;
+ const bool transformed = mode != 9 && mode != 10;
+ const deUint32 colorIndexBC = mode < 10 ? 3 : 4;
+ deUint64 colorIndexData = high >> (mode < 10 ? 18 : 1);
+ const deUint32 anchorIndex[2] = { 0, anchorIndicesSecondSubset2[d] };
+
+ switch (mode)
+ {
+ case 0:
+ g[2] |= getBits128(low, high, 2, 2) << 4;
+ b[2] |= getBits128(low, high, 3, 3) << 4;
+ b[3] |= getBits128(low, high, 4, 4) << 4;
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 39);
+ g[3] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 49);
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 59);
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 75);
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsG = deltaBitsB = 5;
+ break;
+
+ case 1:
+ g[2] |= getBits128(low, high, 2, 2) << 5;
+ g[3] |= getBits128(low, high, 3, 3) << 4;
+ g[3] |= getBits128(low, high, 4, 4) << 5;
+ r[0] |= getBits128(low, high, 5, 11);
+ b[3] |= getBits128(low, high, 12, 12);
+ b[3] |= getBits128(low, high, 13, 13) << 1;
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 21);
+ b[2] |= getBits128(low, high, 22, 22) << 5;
+ b[3] |= getBits128(low, high, 23, 23) << 2;
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 31);
+ b[3] |= getBits128(low, high, 32, 32) << 3;
+ b[3] |= getBits128(low, high, 33, 33) << 5;
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 40);
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 60);
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 70);
+ r[3] |= getBits128(low, high, 71, 76);
+ deltaBitsR = deltaBitsG = deltaBitsB = 6;
+ break;
+
+ case 2:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 39);
+ r[0] |= getBits128(low, high, 40, 40) << 10;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 48);
+ g[0] |= getBits128(low, high, 49, 49) << 10;
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 58);
+ b[0] |= getBits128(low, high, 59, 59) << 10;
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 75);
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = 5;
+ deltaBitsG = deltaBitsB = 4;
+ break;
+
+ case 3:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 38);
+ r[0] |= getBits128(low, high, 39, 39) << 10;
+ g[3] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 49);
+ g[0] |= getBits128(low, high, 50, 50) << 10;
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 58);
+ b[0] |= getBits128(low, high, 59, 59) << 10;
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 68);
+ b[3] |= getBits128(low, high, 69, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 74);
+ g[2] |= getBits128(low, high, 75, 75) << 4;
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsB = 4;
+ deltaBitsG = 5;
+ break;
+
+ case 4:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 38);
+ r[0] |= getBits128(low, high, 39, 39) << 10;
+ b[2] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 48);
+ g[0] |= getBits128(low, high, 49, 49) << 10;
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 59);
+ b[0] |= getBits128(low, high, 60, 60) << 10;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 68);
+ b[3] |= getBits128(low, high, 69, 69) << 1;
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 74);
+ b[3] |= getBits128(low, high, 75, 75) << 4;
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsG = 4;
+ deltaBitsB = 5;
+ break;
+
+ case 5:
+ r[0] |= getBits128(low, high, 5, 13);
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 23);
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 33);
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 39);
+ g[3] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 49);
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 59);
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 75);
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsG = deltaBitsB = 5;
+ break;
+
+ case 6:
+ r[0] |= getBits128(low, high, 5, 12);
+ g[3] |= getBits128(low, high, 13, 13) << 4;
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 22);
+ b[3] |= getBits128(low, high, 23, 23) << 2;
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 32);
+ b[3] |= getBits128(low, high, 33, 33) << 3;
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 40);
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 49);
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 59);
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 70);
+ r[3] |= getBits128(low, high, 71, 76);
+ deltaBitsR = 6;
+ deltaBitsG = deltaBitsB = 5;
+ break;
+
+ case 7:
+ r[0] |= getBits128(low, high, 5, 12);
+ b[3] |= getBits128(low, high, 13, 13);
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 22);
+ g[2] |= getBits128(low, high, 23, 23) << 5;
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 32);
+ g[3] |= getBits128(low, high, 33, 33) << 5;
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 39);
+ g[3] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 59);
+ b[3] |= getBits128(low, high, 60, 60) << 1;
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 75);
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsB = 5;
+ deltaBitsG = 6;
+ break;
+
+ case 8:
+ r[0] |= getBits128(low, high, 5, 12);
+ b[3] |= getBits128(low, high, 13, 13) << 1;
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 22);
+ b[2] |= getBits128(low, high, 23, 23) << 5;
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 32);
+ b[3] |= getBits128(low, high, 33, 33) << 5;
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 39);
+ g[3] |= getBits128(low, high, 40, 40) << 4;
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 49);
+ b[3] |= getBits128(low, high, 50, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 60);
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 69);
+ b[3] |= getBits128(low, high, 70, 70) << 2;
+ r[3] |= getBits128(low, high, 71, 75);
+ b[3] |= getBits128(low, high, 76, 76) << 3;
+ deltaBitsR = deltaBitsG = 5;
+ deltaBitsB = 6;
+ break;
+
+ case 9:
+ r[0] |= getBits128(low, high, 5, 10);
+ g[3] |= getBits128(low, high, 11, 11) << 4;
+ b[3] |= getBits128(low, high, 12, 13);
+ b[2] |= getBits128(low, high, 14, 14) << 4;
+ g[0] |= getBits128(low, high, 15, 20);
+ g[2] |= getBits128(low, high, 21, 21) << 5;
+ b[2] |= getBits128(low, high, 22, 22) << 5;
+ b[3] |= getBits128(low, high, 23, 23) << 2;
+ g[2] |= getBits128(low, high, 24, 24) << 4;
+ b[0] |= getBits128(low, high, 25, 30);
+ g[3] |= getBits128(low, high, 31, 31) << 5;
+ b[3] |= getBits128(low, high, 32, 32) << 3;
+ b[3] |= getBits128(low, high, 33, 33) << 5;
+ b[3] |= getBits128(low, high, 34, 34) << 4;
+ r[1] |= getBits128(low, high, 35, 40);
+ g[2] |= getBits128(low, high, 41, 44);
+ g[1] |= getBits128(low, high, 45, 50);
+ g[3] |= getBits128(low, high, 51, 54);
+ b[1] |= getBits128(low, high, 55, 60);
+ b[2] |= getBits128(low, high, 61, 64);
+ r[2] |= getBits128(low, high, 65, 70);
+ r[3] |= getBits128(low, high, 71, 76);
+ deltaBitsR = deltaBitsG = deltaBitsB = 6;
+ break;
+
+ case 10:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 44);
+ g[1] |= getBits128(low, high, 45, 54);
+ b[1] |= getBits128(low, high, 55, 64);
+ deltaBitsR = deltaBitsG = deltaBitsB = 10;
+ break;
+
+ case 11:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 43);
+ r[0] |= getBits128(low, high, 44, 44) << 10;
+ g[1] |= getBits128(low, high, 45, 53);
+ g[0] |= getBits128(low, high, 54, 54) << 10;
+ b[1] |= getBits128(low, high, 55, 63);
+ b[0] |= getBits128(low, high, 64, 64) << 10;
+ deltaBitsR = deltaBitsG = deltaBitsB = 9;
+ break;
+
+ case 12:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 42);
+ r[0] |= getBits128(low, high, 44, 43) << 10;
+ g[1] |= getBits128(low, high, 45, 52);
+ g[0] |= getBits128(low, high, 54, 53) << 10;
+ b[1] |= getBits128(low, high, 55, 62);
+ b[0] |= getBits128(low, high, 64, 63) << 10;
+ deltaBitsR = deltaBitsG = deltaBitsB = 8;
+ break;
+
+ case 13:
+ r[0] |= getBits128(low, high, 5, 14);
+ g[0] |= getBits128(low, high, 15, 24);
+ b[0] |= getBits128(low, high, 25, 34);
+ r[1] |= getBits128(low, high, 35, 38);
+ r[0] |= getBits128(low, high, 44, 39) << 10;
+ g[1] |= getBits128(low, high, 45, 48);
+ g[0] |= getBits128(low, high, 54, 49) << 10;
+ b[1] |= getBits128(low, high, 55, 58);
+ b[0] |= getBits128(low, high, 64, 59) << 10;
+ deltaBitsR = deltaBitsG = deltaBitsB = 4;
+ break;
+ };
+
+ if (hasSign)
+ {
+ r[0] = signExtend(r[0], epBits[mode], 32);
+ g[0] = signExtend(g[0], epBits[mode], 32);
+ b[0] = signExtend(b[0], epBits[mode], 32);
+ }
+
+ if (transformed)
+ {
+ for (deUint32 i = 1; i < numEndpoints; i++)
+ {
+ r[i] = signExtend(r[i], deltaBitsR, 32);
+ r[i] = (r[0] + r[i]) & (((deUint32)1 << epBits[mode]) - 1);
+ g[i] = signExtend(g[i], deltaBitsG, 32);
+ g[i] = (g[0] + g[i]) & (((deUint32)1 << epBits[mode]) - 1);
+ b[i] = signExtend(b[i], deltaBitsB, 32);
+ b[i] = (b[0] + b[i]) & (((deUint32)1 << epBits[mode]) - 1);
+ }
+ }
+
+ if (hasSign)
+ {
+ for (deUint32 i = 1; i < 4; i++)
+ {
+ r[i] = signExtend(r[i], epBits[mode], 32);
+ g[i] = signExtend(g[i], epBits[mode], 32);
+ b[i] = signExtend(b[i], epBits[mode], 32);
+ }
+ }
+
+ for (deUint32 i = 0; i < numEndpoints; i++)
+ {
+ r[i] = unquantize(r[i], mode, hasSign);
+ g[i] = unquantize(g[i], mode, hasSign);
+ b[i] = unquantize(b[i], mode, hasSign);
+ }
+
+ for (deUint32 i = 0; i < 16; i++)
+ {
+ const deUint32 subsetIndex = (numRegions == 1 ? 0 : partitions2[d][i]);
+ const deUint32 bits = (i == anchorIndex[subsetIndex]) ? (colorIndexBC - 1) : colorIndexBC;
+ const deUint32 colorIndex = (deUint32)(colorIndexData & ((1 << bits) - 1));
+ const deInt32 endpointStartR = r[2 * subsetIndex];
+ const deInt32 endpointEndR = r[2 * subsetIndex + 1];
+ const deInt32 endpointStartG = g[2 * subsetIndex];
+ const deInt32 endpointEndG = g[2 * subsetIndex + 1];
+ const deInt32 endpointStartB = b[2 * subsetIndex];
+ const deInt32 endpointEndB = b[2 * subsetIndex + 1];
+ const deInt16 r16 = finishUnquantize(interpolate(endpointStartR, endpointEndR, colorIndex, colorIndexBC), hasSign);
+ const deInt16 g16 = finishUnquantize(interpolate(endpointStartG, endpointEndG, colorIndex, colorIndexBC), hasSign);
+ const deInt16 b16 = finishUnquantize(interpolate(endpointStartB, endpointEndB, colorIndex, colorIndexBC), hasSign);
+ const deInt32 y = i / 4;
+ const deInt32 x = i % 4;
+ deInt16* const dstPixel = (deInt16*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+
+ if (mode == -1)
+ {
+ dstPixel[0] = 0;
+ dstPixel[1] = 0;
+ dstPixel[2] = 0;
+ }
+ else
+ {
+ dstPixel[0] = r16;
+ dstPixel[1] = g16;
+ dstPixel[2] = b16;
+ }
+
+ colorIndexData >>= bits;
+ }
+}
+
+void decompressBc7 (const PixelBufferAccess& dst, const deUint8* src)
+{
+ using namespace BcDecompressInternal;
+
+ static const deUint8 subsets[] = { 3, 2, 3, 2, 1, 1, 1, 2 };
+ static const deUint8 partitionBits[] = { 4, 6, 6, 6, 0, 0, 0, 6 };
+ static const deUint8 endpointBits[8][5] =
+ {
+ //r, g, b, a, p
+ { 4, 4, 4, 0, 1 },
+ { 6, 6, 6, 0, 1 },
+ { 5, 5, 5, 0, 0 },
+ { 7, 7, 7, 0, 1 },
+ { 5, 5, 5, 6, 0 },
+ { 7, 7, 7, 8, 0 },
+ { 7, 7, 7, 7, 1 },
+ { 5, 5, 5, 5, 1 }
+ };
+ static const deUint8 indexBits[] = { 3, 3, 2, 2, 2, 2, 4, 2 };
+
+ deUint8* const dstPtr = (deUint8*)dst.getDataPtr();
+ const deUint32 dstRowPitch = dst.getRowPitch();
+ const deUint32 dstPixelSize = 4;
+
+ const deUint64 low = ((deUint64*)src)[0];
+ const deUint64 high = ((deUint64*)src)[1];
+ const deInt32 mode = extractModeBc7(src[0]);
+ deUint32 numSubsets = 1;
+ deUint32 offset = mode + 1;
+ deUint32 rotation = 0;
+ deUint32 idxMode = 0;
+ deUint32 endpoints[6][5];
+ deUint32 partitionSetId = 0;
+
+ // Decode partition data from explicit partition bits
+ if (mode == 0 || mode == 1 || mode == 2 || mode == 3 || mode == 7)
+ {
+ numSubsets = subsets[mode];
+ partitionSetId = getBits128(low, high, offset, offset + partitionBits[mode] - 1);
+ offset += partitionBits[mode];
+ }
+
+ // Extract rotation bits
+ if (mode == 4 || mode == 5)
+ {
+ rotation = getBits128(low, high, offset, offset + 1);
+ offset += 2;
+ if (mode == 4)
+ {
+ idxMode = getBits128(low, high, offset, offset);
+ offset++;
+ }
+ }
+
+ {
+ const deUint32 numEndpoints = numSubsets * 2;
+
+ // Extract raw, compressed endpoint bits
+ for (deUint32 cpnt = 0; cpnt < 5; cpnt++)
+ {
+ for (deUint32 ep = 0; ep < numEndpoints; ep++)
+ {
+ if (mode == 1 && cpnt == 4 && ep > 1)
+ continue; // Mode 1 has shared P bits
+
+ int n = mode == -1 ? 0 : endpointBits[mode][cpnt];
+ if (n > 0)
+ endpoints[ep][cpnt] = getBits128(low, high, offset, offset + n - 1);
+ offset += n;
+ }
+ }
+
+ // Decode endpoints
+ if (mode == 0 || mode == 1 || mode == 3 || mode == 6 || mode == 7)
+ {
+ // First handle modes that have P-bits
+ for (deUint32 ep = 0; ep < numEndpoints; ep++)
+ {
+ for (deUint32 cpnt = 0; cpnt < 4; cpnt++)
+ {
+ endpoints[ep][cpnt] <<= 1;
+ }
+ }
+
+ if (mode == 1)
+ {
+ // P-bit is shared
+ const deUint32 pbitZero = endpoints[0][4];
+ const deUint32 pbitOne = endpoints[1][4];
+
+ for (deUint32 cpnt = 0; cpnt < 3; cpnt++)
+ {
+ endpoints[0][cpnt] |= pbitZero;
+ endpoints[1][cpnt] |= pbitZero;
+ endpoints[2][cpnt] |= pbitOne;
+ endpoints[3][cpnt] |= pbitOne;
+ }
+ }
+ else
+ {
+ // Unique p-bit per endpoint
+ for (deUint32 ep = 0; ep < numEndpoints; ep++)
+ {
+ for (deUint32 cpnt = 0; cpnt < 4; cpnt++)
+ {
+ endpoints[ep][cpnt] |= endpoints[ep][4];
+ }
+ }
+ }
+ }
+
+ for (deUint32 ep = 0; ep < numEndpoints; ep++)
+ {
+ // Left shift endpoint components so that their MSB lies in bit 7
+ for (deUint32 cpnt = 0; cpnt < 4; cpnt++)
+ endpoints[ep][cpnt] <<= 8 - (endpointBits[mode][cpnt] + endpointBits[mode][4]);
+
+ // Replicate each component's MSB into the LSBs revealed by the left-shift operation above
+ for (deUint32 cpnt = 0; cpnt < 4; cpnt++)
+ endpoints[ep][cpnt] |= endpoints[ep][cpnt] >> (endpointBits[mode][cpnt] + endpointBits[mode][4]);
+ }
+
+ // If this mode does not explicitly define the alpha component set alpha equal to 1.0
+ if (mode < 4)
+ {
+ for (deUint32 ep = 0; ep < numEndpoints; ep++)
+ endpoints[ep][3] = 255;
+ }
+ }
+
+ {
+ deUint32 colorIdxOffset = offset + ((mode == 4 && idxMode) ? 31 : 0);
+ deUint32 alphaIdxOffset = offset + ((mode == 5 || (mode == 4 && !idxMode)) ? 31 : 0);
+
+ for (deUint32 pixel = 0; pixel < 16; pixel++)
+ {
+ const deUint32 y = pixel / 4;
+ const deUint32 x = pixel % 4;
+ deUint32* const dstPixel = (deUint32*)(dstPtr + y * dstRowPitch + x * dstPixelSize);
+ deUint32 subsetIndex = 0;
+ deUint32 anchorIndex = 0;
+ deUint32 endpointStart[4];
+ deUint32 endpointEnd[4];
+
+ if (mode == -1)
+ {
+ *dstPixel = 0;
+ continue;
+ }
+
+ if (numSubsets == 2)
+ subsetIndex = partitions2[partitionSetId][pixel];
+ else if (numSubsets == 3)
+ subsetIndex = partitions3[partitionSetId][pixel];
+
+ if (numSubsets == 2 && subsetIndex == 1)
+ {
+ anchorIndex = anchorIndicesSecondSubset2[partitionSetId];
+ }
+ else if (numSubsets == 3)
+ {
+ if (subsetIndex == 1)
+ anchorIndex = anchorIndicesSecondSubset3[partitionSetId];
+ else if (subsetIndex == 2)
+ anchorIndex = anchorIndicesThirdSubset[partitionSetId];
+ }
+
+ for (deUint32 cpnt = 0; cpnt < 4; cpnt++)
+ {
+ endpointStart[cpnt] = endpoints[2 * subsetIndex][cpnt];
+ endpointEnd[cpnt] = endpoints[2 * subsetIndex + 1][cpnt];
+ }
+
+ {
+ const deUint32 colorInterpolationBits = indexBits[mode] + idxMode;
+ const deUint32 colorIndexBits = colorInterpolationBits - ((anchorIndex == pixel) ? 1 : 0);
+ const deUint32 alphaInterpolationBits = mode == 4 ? 3 - idxMode : (mode == 5 ? 2 : colorInterpolationBits);
+ const deUint32 alphaIndexBits = alphaInterpolationBits - ((anchorIndex == pixel) ? 1 : 0);
+ const deUint32 colorIdx = getBits128(low, high, colorIdxOffset, colorIdxOffset + colorIndexBits - 1);
+ const deUint32 alphaIdx = (mode == 4 || mode == 5) ? getBits128(low, high, alphaIdxOffset, alphaIdxOffset + alphaIndexBits - 1) : colorIdx;
+ const deUint32 r = interpolate(endpointStart[0], endpointEnd[0], colorIdx, colorInterpolationBits);
+ const deUint32 g = interpolate(endpointStart[1], endpointEnd[1], colorIdx, colorInterpolationBits);
+ const deUint32 b = interpolate(endpointStart[2], endpointEnd[2], colorIdx, colorInterpolationBits);
+ const deUint32 a = interpolate(endpointStart[3], endpointEnd[3], alphaIdx, alphaInterpolationBits);
+
+ colorIdxOffset += colorIndexBits;
+ alphaIdxOffset += alphaIndexBits;
+
+ if ((mode == 4 || mode == 5) && rotation != 0)
+ {
+ if (rotation == 1)
+ *dstPixel = a | (g << 8) | (b << 16) | (r << 24);
+ else if (rotation == 2)
+ *dstPixel = r | (a << 8) | (b << 16) | (g << 24);
+ else
+ *dstPixel = r | (g << 8) | (a << 16) | (b << 24);
+ }
+ else
+ {
+ *dstPixel = r | (g << 8) | (b << 16) | (a << 24);
+ }
+ }
+ }
+ }
+}
+
void decompressBlock (CompressedTexFormat format, const PixelBufferAccess& dst, const deUint8* src, const TexDecompressionParams& params)
{
// No 3D blocks supported right now
astc::decompress(dst, src, format, params.astcMode);
break;
+ case COMPRESSEDTEXFORMAT_BC1_RGB_UNORM_BLOCK: decompressBc1 (dst, src, false); break;
+ case COMPRESSEDTEXFORMAT_BC1_RGB_SRGB_BLOCK: decompressBc1 (dst, src, false); break;
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_UNORM_BLOCK: decompressBc1 (dst, src, true); break;
+ case COMPRESSEDTEXFORMAT_BC1_RGBA_SRGB_BLOCK: decompressBc1 (dst, src, true); break;
+ case COMPRESSEDTEXFORMAT_BC2_UNORM_BLOCK: decompressBc2 (dst, src); break;
+ case COMPRESSEDTEXFORMAT_BC2_SRGB_BLOCK: decompressBc2 (dst, src); break;
+ case COMPRESSEDTEXFORMAT_BC3_UNORM_BLOCK: decompressBc3 (dst, src); break;
+ case COMPRESSEDTEXFORMAT_BC3_SRGB_BLOCK: decompressBc3 (dst, src); break;
+ case COMPRESSEDTEXFORMAT_BC4_UNORM_BLOCK: decompressBc4 (dst, src, false); break;
+ case COMPRESSEDTEXFORMAT_BC4_SNORM_BLOCK: decompressBc4 (dst, src, true); break;
+ case COMPRESSEDTEXFORMAT_BC5_UNORM_BLOCK: decompressBc5 (dst, src, false); break;
+ case COMPRESSEDTEXFORMAT_BC5_SNORM_BLOCK: decompressBc5 (dst, src, true); break;
+ case COMPRESSEDTEXFORMAT_BC6H_UFLOAT_BLOCK: decompressBc6H (dst, src, false); break;
+ case COMPRESSEDTEXFORMAT_BC6H_SFLOAT_BLOCK: decompressBc6H (dst, src, true); break;
+ case COMPRESSEDTEXFORMAT_BC7_UNORM_BLOCK: decompressBc7 (dst, src); break;
+ case COMPRESSEDTEXFORMAT_BC7_SRGB_BLOCK: decompressBc7 (dst, src); break;
+
default:
- DE_ASSERT(false);
+ DE_FATAL("Unexpected format");
break;
}
}