ThirdParty/Squish/alpha.cpp

*2f083884Ss.makeev_local/* -----------------------------------------------------------------------------
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	Copyright (c) 2006 Simon Brown                          [email protected]
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	Permission is hereby granted, free of charge, to any person obtaining
*2f083884Ss.makeev_local	a copy of this software and associated documentation files (the
*2f083884Ss.makeev_local	"Software"), to	deal in the Software without restriction, including
*2f083884Ss.makeev_local	without limitation the rights to use, copy, modify, merge, publish,
*2f083884Ss.makeev_local	distribute, sublicense, and/or sell copies of the Software, and to
*2f083884Ss.makeev_local	permit persons to whom the Software is furnished to do so, subject to
*2f083884Ss.makeev_local	the following conditions:
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	The above copyright notice and this permission notice shall be included
*2f083884Ss.makeev_local	in all copies or substantial portions of the Software.
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
*2f083884Ss.makeev_local	OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
*2f083884Ss.makeev_local	MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
*2f083884Ss.makeev_local	IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
*2f083884Ss.makeev_local	CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
*2f083884Ss.makeev_local	TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
*2f083884Ss.makeev_local	SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local   -------------------------------------------------------------------------- */
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local#include "alpha.h"
*2f083884Ss.makeev_local#include <algorithm>
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localnamespace squish {
*2f083884Ss.makeev_local
// Converts a float to an integer by adding one half and truncating, then
// clamps the result to the range [0, limit].
static int FloatToInt( float a, int limit )
{
	// truncation after adding a half gives round-to-nearest
	int const rounded = static_cast< int >( a + 0.5f );

	// anything below zero collapses to zero
	if( rounded < 0 )
		return 0;

	// otherwise cap at the upper limit
	return ( rounded > limit ) ? limit : rounded;
}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid CompressAlphaDxt3( u8 const* rgba, int mask, void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	u8* bytes = reinterpret_cast< u8* >( block );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// quantise and pack the alpha values pairwise
*2f083884Ss.makeev_local	for( int i = 0; i < 8; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// quantise down to 4 bits
*2f083884Ss.makeev_local		float alpha1 = ( float )rgba[8*i + 3] * ( 15.0f/255.0f );
*2f083884Ss.makeev_local		float alpha2 = ( float )rgba[8*i + 7] * ( 15.0f/255.0f );
*2f083884Ss.makeev_local		int quant1 = FloatToInt( alpha1, 15 );
*2f083884Ss.makeev_local		int quant2 = FloatToInt( alpha2, 15 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// set alpha to zero where masked
*2f083884Ss.makeev_local		int bit1 = 1 << ( 2*i );
*2f083884Ss.makeev_local		int bit2 = 1 << ( 2*i + 1 );
*2f083884Ss.makeev_local		if( ( mask & bit1 ) == 0 )
*2f083884Ss.makeev_local			quant1 = 0;
*2f083884Ss.makeev_local		if( ( mask & bit2 ) == 0 )
*2f083884Ss.makeev_local			quant2 = 0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// pack into the byte
*2f083884Ss.makeev_local		bytes[i] = ( u8 )( quant1 | ( quant2 << 4 ) );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid DecompressAlphaDxt3( u8* rgba, void const* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	u8 const* bytes = reinterpret_cast< u8 const* >( block );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// unpack the alpha values pairwise
*2f083884Ss.makeev_local	for( int i = 0; i < 8; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// quantise down to 4 bits
*2f083884Ss.makeev_local		u8 quant = bytes[i];
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// unpack the values
*2f083884Ss.makeev_local		u8 lo = quant & 0x0f;
*2f083884Ss.makeev_local		u8 hi = quant & 0xf0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// convert back up to bytes
*2f083884Ss.makeev_local		rgba[8*i + 3] = lo | ( lo << 4 );
*2f083884Ss.makeev_local		rgba[8*i + 7] = hi | ( hi >> 4 );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
// Widens the interval [min, max] until it spans at least steps, keeping it
// inside 0..255. The upper end is raised first; the lower end is lowered
// only if raising alone was not enough.
static void FixRange( int& min, int& max, int steps )
{
	// nothing to do when the interval is already wide enough
	if( max - min >= steps )
		return;

	// push the top up, but not past 255
	max = std::min( min + steps, 255 );
	if( max - min >= steps )
		return;

	// still too narrow, so pull the bottom down, but not below 0
	min = std::max( 0, max - steps );
}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localstatic int FitCodes( u8 const* rgba, int mask, u8 const* codes, u8* indices )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// fit each alpha value to the codebook
*2f083884Ss.makeev_local	int err = 0;
*2f083884Ss.makeev_local	for( int i = 0; i < 16; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// check this pixel is valid
*2f083884Ss.makeev_local		int bit = 1 << i;
*2f083884Ss.makeev_local		if( ( mask & bit ) == 0 )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			// use the first code
*2f083884Ss.makeev_local			indices[i] = 0;
*2f083884Ss.makeev_local			continue;
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// find the least error and corresponding index
*2f083884Ss.makeev_local		int value = rgba[4*i + 3];
*2f083884Ss.makeev_local		int least = 2000000000;//INT_MAX;
*2f083884Ss.makeev_local		int index = 0;
*2f083884Ss.makeev_local		for( int j = 0; j < 8; ++j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			// get the squared error from this code
*2f083884Ss.makeev_local			int dist = ( int )value - ( int )codes[j];
*2f083884Ss.makeev_local			dist *= dist;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local			// compare with the best so far
*2f083884Ss.makeev_local			if( dist < least )
*2f083884Ss.makeev_local			{
*2f083884Ss.makeev_local				least = dist;
*2f083884Ss.makeev_local				index = j;
*2f083884Ss.makeev_local			}
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// save this index and accumulate the error
*2f083884Ss.makeev_local		indices[i] = ( u8 )index;
*2f083884Ss.makeev_local		err += least;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// return the total error
*2f083884Ss.makeev_local	return err;
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localstatic void WriteAlphaBlock( int alpha0, int alpha1, u8 const* indices, void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	u8* bytes = reinterpret_cast< u8* >( block );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// write the first two bytes
*2f083884Ss.makeev_local	bytes[0] = ( u8 )alpha0;
*2f083884Ss.makeev_local	bytes[1] = ( u8 )alpha1;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// pack the indices with 3 bits each
*2f083884Ss.makeev_local	u8* dest = bytes + 2;
*2f083884Ss.makeev_local	u8 const* src = indices;
*2f083884Ss.makeev_local	for( int i = 0; i < 2; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// pack 8 3-bit values
*2f083884Ss.makeev_local		int value = 0;
*2f083884Ss.makeev_local		for( int j = 0; j < 8; ++j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			int index = *src++;
*2f083884Ss.makeev_local			value |= ( index << 3*j );
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// store in 3 bytes
*2f083884Ss.makeev_local		for( int j = 0; j < 3; ++j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			int byte = ( value >> 8*j ) & 0xff;
*2f083884Ss.makeev_local			*dest++ = ( u8 )byte;
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localstatic void WriteAlphaBlock5( int alpha0, int alpha1, u8 const* indices, void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// check the relative values of the endpoints
*2f083884Ss.makeev_local	if( alpha0 > alpha1 )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// swap the indices
*2f083884Ss.makeev_local		u8 swapped[16];
*2f083884Ss.makeev_local		for( int i = 0; i < 16; ++i )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			u8 index = indices[i];
*2f083884Ss.makeev_local			if( index == 0 )
*2f083884Ss.makeev_local				swapped[i] = 1;
*2f083884Ss.makeev_local			else if( index == 1 )
*2f083884Ss.makeev_local				swapped[i] = 0;
*2f083884Ss.makeev_local			else if( index <= 5 )
*2f083884Ss.makeev_local				swapped[i] = 7 - index;
*2f083884Ss.makeev_local			else
*2f083884Ss.makeev_local				swapped[i] = index;
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// write the block
*2f083884Ss.makeev_local		WriteAlphaBlock( alpha1, alpha0, swapped, block );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local	else
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// write the block
*2f083884Ss.makeev_local		WriteAlphaBlock( alpha0, alpha1, indices, block );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localstatic void WriteAlphaBlock7( int alpha0, int alpha1, u8 const* indices, void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// check the relative values of the endpoints
*2f083884Ss.makeev_local	if( alpha0 < alpha1 )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// swap the indices
*2f083884Ss.makeev_local		u8 swapped[16];
*2f083884Ss.makeev_local		for( int i = 0; i < 16; ++i )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			u8 index = indices[i];
*2f083884Ss.makeev_local			if( index == 0 )
*2f083884Ss.makeev_local				swapped[i] = 1;
*2f083884Ss.makeev_local			else if( index == 1 )
*2f083884Ss.makeev_local				swapped[i] = 0;
*2f083884Ss.makeev_local			else
*2f083884Ss.makeev_local				swapped[i] = 9 - index;
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// write the block
*2f083884Ss.makeev_local		WriteAlphaBlock( alpha1, alpha0, swapped, block );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local	else
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// write the block
*2f083884Ss.makeev_local		WriteAlphaBlock( alpha0, alpha1, indices, block );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid CompressAlphaDxt5( u8 const* rgba, int mask, void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// get the range for 5-alpha and 7-alpha interpolation
*2f083884Ss.makeev_local	int min5 = 255;
*2f083884Ss.makeev_local	int max5 = 0;
*2f083884Ss.makeev_local	int min7 = 255;
*2f083884Ss.makeev_local	int max7 = 0;
*2f083884Ss.makeev_local	for( int i = 0; i < 16; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// check this pixel is valid
*2f083884Ss.makeev_local		int bit = 1 << i;
*2f083884Ss.makeev_local		if( ( mask & bit ) == 0 )
*2f083884Ss.makeev_local			continue;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// incorporate into the min/max
*2f083884Ss.makeev_local		int value = rgba[4*i + 3];
*2f083884Ss.makeev_local		if( value < min7 )
*2f083884Ss.makeev_local			min7 = value;
*2f083884Ss.makeev_local		if( value > max7 )
*2f083884Ss.makeev_local			max7 = value;
*2f083884Ss.makeev_local		if( value != 0 && value < min5 )
*2f083884Ss.makeev_local			min5 = value;
*2f083884Ss.makeev_local		if( value != 255 && value > max5 )
*2f083884Ss.makeev_local			max5 = value;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// handle the case that no valid range was found
*2f083884Ss.makeev_local	if( min5 > max5 )
*2f083884Ss.makeev_local		min5 = max5;
*2f083884Ss.makeev_local	if( min7 > max7 )
*2f083884Ss.makeev_local		min7 = max7;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// fix the range to be the minimum in each case
*2f083884Ss.makeev_local	FixRange( min5, max5, 5 );
*2f083884Ss.makeev_local	FixRange( min7, max7, 7 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// set up the 5-alpha code book
*2f083884Ss.makeev_local	u8 codes5[8];
*2f083884Ss.makeev_local	codes5[0] = ( u8 )min5;
*2f083884Ss.makeev_local	codes5[1] = ( u8 )max5;
*2f083884Ss.makeev_local	for( int i = 1; i < 5; ++i )
*2f083884Ss.makeev_local		codes5[1 + i] = ( u8 )( ( ( 5 - i )*min5 + i*max5 )/5 );
*2f083884Ss.makeev_local	codes5[6] = 0;
*2f083884Ss.makeev_local	codes5[7] = 255;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// set up the 7-alpha code book
*2f083884Ss.makeev_local	u8 codes7[8];
*2f083884Ss.makeev_local	codes7[0] = ( u8 )min7;
*2f083884Ss.makeev_local	codes7[1] = ( u8 )max7;
*2f083884Ss.makeev_local	for( int i = 1; i < 7; ++i )
*2f083884Ss.makeev_local		codes7[1 + i] = ( u8 )( ( ( 7 - i )*min7 + i*max7 )/7 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// fit the data to both code books
*2f083884Ss.makeev_local	u8 indices5[16];
*2f083884Ss.makeev_local	u8 indices7[16];
*2f083884Ss.makeev_local	int err5 = FitCodes( rgba, mask, codes5, indices5 );
*2f083884Ss.makeev_local	int err7 = FitCodes( rgba, mask, codes7, indices7 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// save the block with least error
*2f083884Ss.makeev_local	if( err5 <= err7 )
*2f083884Ss.makeev_local		WriteAlphaBlock5( min5, max5, indices5, block );
*2f083884Ss.makeev_local	else
*2f083884Ss.makeev_local		WriteAlphaBlock7( min7, max7, indices7, block );
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid DecompressAlphaDxt5( u8* rgba, void const* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// get the two alpha values
*2f083884Ss.makeev_local	u8 const* bytes = reinterpret_cast< u8 const* >( block );
*2f083884Ss.makeev_local	int alpha0 = bytes[0];
*2f083884Ss.makeev_local	int alpha1 = bytes[1];
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// compare the values to build the codebook
*2f083884Ss.makeev_local	u8 codes[8];
*2f083884Ss.makeev_local	codes[0] = ( u8 )alpha0;
*2f083884Ss.makeev_local	codes[1] = ( u8 )alpha1;
*2f083884Ss.makeev_local	if( alpha0 <= alpha1 )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// use 5-alpha codebook
*2f083884Ss.makeev_local		for( int i = 1; i < 5; ++i )
*2f083884Ss.makeev_local			codes[1 + i] = ( u8 )( ( ( 5 - i )*alpha0 + i*alpha1 )/5 );
*2f083884Ss.makeev_local		codes[6] = 0;
*2f083884Ss.makeev_local		codes[7] = 255;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local	else
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// use 7-alpha codebook
*2f083884Ss.makeev_local		for( int i = 1; i < 7; ++i )
*2f083884Ss.makeev_local			codes[1 + i] = ( u8 )( ( ( 7 - i )*alpha0 + i*alpha1 )/7 );
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// decode the indices
*2f083884Ss.makeev_local	u8 indices[16];
*2f083884Ss.makeev_local	u8 const* src = bytes + 2;
*2f083884Ss.makeev_local	u8* dest = indices;
*2f083884Ss.makeev_local	for( int i = 0; i < 2; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// grab 3 bytes
*2f083884Ss.makeev_local		int value = 0;
*2f083884Ss.makeev_local		for( int j = 0; j < 3; ++j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			int byte = *src++;
*2f083884Ss.makeev_local			value |= ( byte << 8*j );
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// unpack 8 3-bit values from it
*2f083884Ss.makeev_local		for( int j = 0; j < 8; ++j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			int index = ( value >> 3*j ) & 0x7;
*2f083884Ss.makeev_local			*dest++ = ( u8 )index;
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// write out the indexed codebook values
*2f083884Ss.makeev_local	for( int i = 0; i < 16; ++i )
*2f083884Ss.makeev_local		rgba[4*i + 3] = codes[indices[i]];
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local} // namespace squish