ThirdParty/Squish/clusterfit.cpp

*2f083884Ss.makeev_local/* -----------------------------------------------------------------------------
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	Copyright (c) 2006 Simon Brown                          si@sjbrown.co.uk
*2f083884Ss.makeev_local	Copyright (c) 2007 Ignacio Castano                   icastano@nvidia.com
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	Permission is hereby granted, free of charge, to any person obtaining
*2f083884Ss.makeev_local	a copy of this software and associated documentation files (the
*2f083884Ss.makeev_local	"Software"), to	deal in the Software without restriction, including
*2f083884Ss.makeev_local	without limitation the rights to use, copy, modify, merge, publish,
*2f083884Ss.makeev_local	distribute, sublicense, and/or sell copies of the Software, and to
*2f083884Ss.makeev_local	permit persons to whom the Software is furnished to do so, subject to
*2f083884Ss.makeev_local	the following conditions:
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	The above copyright notice and this permission notice shall be included
*2f083884Ss.makeev_local	in all copies or substantial portions of the Software.
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
*2f083884Ss.makeev_local	OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
*2f083884Ss.makeev_local	MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
*2f083884Ss.makeev_local	IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
*2f083884Ss.makeev_local	CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
*2f083884Ss.makeev_local	TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
*2f083884Ss.makeev_local	SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local   -------------------------------------------------------------------------- */
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local#include "clusterfit.h"
*2f083884Ss.makeev_local#include "colourset.h"
*2f083884Ss.makeev_local#include "colourblock.h"
*2f083884Ss.makeev_local#include <cfloat>
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localnamespace squish {
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localClusterFit::ClusterFit( ColourSet const* colours, int flags )
*2f083884Ss.makeev_local  : ColourFit( colours, flags )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// set the iteration count
*2f083884Ss.makeev_local	m_iterationCount = ( m_flags & kColourIterativeClusterFit ) ? kMaxIterations : 1;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// initialise the best error
*2f083884Ss.makeev_local	m_besterror = VEC4_CONST( FLT_MAX );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// initialise the metric
*2f083884Ss.makeev_local	bool perceptual = ( ( m_flags & kColourMetricPerceptual ) != 0 );
*2f083884Ss.makeev_local	if( perceptual )
*2f083884Ss.makeev_local		m_metric = Vec4( 0.2126f, 0.7152f, 0.0722f, 0.0f );
*2f083884Ss.makeev_local	else
*2f083884Ss.makeev_local		m_metric = VEC4_CONST( 1.0f );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// cache some values
*2f083884Ss.makeev_local	int const count = m_colours->GetCount();
*2f083884Ss.makeev_local	Vec3 const* values = m_colours->GetPoints();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// get the covariance matrix
*2f083884Ss.makeev_local	Sym3x3 covariance = ComputeWeightedCovariance( count, values, m_colours->GetWeights() );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// compute the principle component
*2f083884Ss.makeev_local	m_principle = ComputePrincipleComponent( covariance );
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localbool ClusterFit::ConstructOrdering( Vec3 const& axis, int iteration )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// cache some values
*2f083884Ss.makeev_local	int const count = m_colours->GetCount();
*2f083884Ss.makeev_local	Vec3 const* values = m_colours->GetPoints();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// build the list of dot products
*2f083884Ss.makeev_local	float dps[16];
*2f083884Ss.makeev_local	u8* order = ( u8* )m_order + 16*iteration;
*2f083884Ss.makeev_local	for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		dps[i] = Dot( values[i], axis );
*2f083884Ss.makeev_local		order[i] = ( u8 )i;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// stable sort using them
*2f083884Ss.makeev_local	for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		for( int j = i; j > 0 && dps[j] < dps[j - 1]; --j )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			std::swap( dps[j], dps[j - 1] );
*2f083884Ss.makeev_local			std::swap( order[j], order[j - 1] );
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// check this ordering is unique
*2f083884Ss.makeev_local	for( int it = 0; it < iteration; ++it )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		u8 const* prev = ( u8* )m_order + 16*it;
*2f083884Ss.makeev_local		bool same = true;
*2f083884Ss.makeev_local		for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			if( order[i] != prev[i] )
*2f083884Ss.makeev_local			{
*2f083884Ss.makeev_local				same = false;
*2f083884Ss.makeev_local				break;
*2f083884Ss.makeev_local			}
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local		if( same )
*2f083884Ss.makeev_local			return false;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// copy the ordering and weight all the points
*2f083884Ss.makeev_local	Vec3 const* unweighted = m_colours->GetPoints();
*2f083884Ss.makeev_local	float const* weights = m_colours->GetWeights();
*2f083884Ss.makeev_local	m_xsum_wsum = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		int j = order[i];
*2f083884Ss.makeev_local		Vec4 p( unweighted[j].X(), unweighted[j].Y(), unweighted[j].Z(), 1.0f );
*2f083884Ss.makeev_local		Vec4 w( weights[j] );
*2f083884Ss.makeev_local		Vec4 x = p*w;
*2f083884Ss.makeev_local		m_points_weights[i] = x;
*2f083884Ss.makeev_local		m_xsum_wsum += x;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local	return true;
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid ClusterFit::Compress3( void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// declare variables
*2f083884Ss.makeev_local	int const count = m_colours->GetCount();
*2f083884Ss.makeev_local	Vec4 const two = VEC4_CONST( 2.0 );
*2f083884Ss.makeev_local	Vec4 const one = VEC4_CONST( 1.0f );
*2f083884Ss.makeev_local	Vec4 const half_half2( 0.5f, 0.5f, 0.5f, 0.25f );
*2f083884Ss.makeev_local	Vec4 const zero = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 const half = VEC4_CONST( 0.5f );
*2f083884Ss.makeev_local	Vec4 const grid( 31.0f, 63.0f, 31.0f, 0.0f );
*2f083884Ss.makeev_local	Vec4 const gridrcp( 1.0f/31.0f, 1.0f/63.0f, 1.0f/31.0f, 0.0f );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// prepare an ordering using the principle axis
*2f083884Ss.makeev_local	ConstructOrdering( m_principle, 0 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// check all possible clusters and iterate on the total order
*2f083884Ss.makeev_local	Vec4 beststart = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 bestend = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 besterror = m_besterror;
*2f083884Ss.makeev_local	u8 bestindices[16];
*2f083884Ss.makeev_local	int bestiteration = 0;
*2f083884Ss.makeev_local	int besti = 0, bestj = 0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// loop over iterations (we avoid the case that all points in first or last cluster)
*2f083884Ss.makeev_local	for( int iterationIndex = 0;; )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// first cluster [0,i) is at the start
*2f083884Ss.makeev_local		Vec4 part0 = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local		for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			// second cluster [i,j) is half along
*2f083884Ss.makeev_local			Vec4 part1 = ( i == 0 ) ? m_points_weights[0] : VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local			int jmin = ( i == 0 ) ? 1 : i;
*2f083884Ss.makeev_local			for( int j = jmin;; )
*2f083884Ss.makeev_local			{
*2f083884Ss.makeev_local				// last cluster [j,count) is at the end
*2f083884Ss.makeev_local				Vec4 part2 = m_xsum_wsum - part1 - part0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// compute least squares terms directly
*2f083884Ss.makeev_local				Vec4 alphax_sum = MultiplyAdd( part1, half_half2, part0 );
*2f083884Ss.makeev_local				Vec4 alpha2_sum = alphax_sum.SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				Vec4 betax_sum = MultiplyAdd( part1, half_half2, part2 );
*2f083884Ss.makeev_local				Vec4 beta2_sum = betax_sum.SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				Vec4 alphabeta_sum = ( part1*half_half2 ).SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// compute the least-squares optimal points
*2f083884Ss.makeev_local				Vec4 factor = Reciprocal( NegativeMultiplySubtract( alphabeta_sum, alphabeta_sum, alpha2_sum*beta2_sum ) );
*2f083884Ss.makeev_local				Vec4 a = NegativeMultiplySubtract( betax_sum, alphabeta_sum, alphax_sum*beta2_sum )*factor;
*2f083884Ss.makeev_local				Vec4 b = NegativeMultiplySubtract( alphax_sum, alphabeta_sum, betax_sum*alpha2_sum )*factor;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// clamp to the grid
*2f083884Ss.makeev_local				a = Min( one, Max( zero, a ) );
*2f083884Ss.makeev_local				b = Min( one, Max( zero, b ) );
*2f083884Ss.makeev_local				a = Truncate( MultiplyAdd( grid, a, half ) )*gridrcp;
*2f083884Ss.makeev_local				b = Truncate( MultiplyAdd( grid, b, half ) )*gridrcp;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// compute the error (we skip the constant xxsum)
*2f083884Ss.makeev_local				Vec4 e1 = MultiplyAdd( a*a, alpha2_sum, b*b*beta2_sum );
*2f083884Ss.makeev_local				Vec4 e2 = NegativeMultiplySubtract( a, alphax_sum, a*b*alphabeta_sum );
*2f083884Ss.makeev_local				Vec4 e3 = NegativeMultiplySubtract( b, betax_sum, e2 );
*2f083884Ss.makeev_local				Vec4 e4 = MultiplyAdd( two, e3, e1 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// apply the metric to the error term
*2f083884Ss.makeev_local				Vec4 e5 = e4*m_metric;
*2f083884Ss.makeev_local				Vec4 error = e5.SplatX() + e5.SplatY() + e5.SplatZ();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// keep the solution if it wins
*2f083884Ss.makeev_local				if( CompareAnyLessThan( error, besterror ) )
*2f083884Ss.makeev_local				{
*2f083884Ss.makeev_local					beststart = a;
*2f083884Ss.makeev_local					bestend = b;
*2f083884Ss.makeev_local					besti = i;
*2f083884Ss.makeev_local					bestj = j;
*2f083884Ss.makeev_local					besterror = error;
*2f083884Ss.makeev_local					bestiteration = iterationIndex;
*2f083884Ss.makeev_local				}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// advance
*2f083884Ss.makeev_local				if( j == count )
*2f083884Ss.makeev_local					break;
*2f083884Ss.makeev_local				part1 += m_points_weights[j];
*2f083884Ss.makeev_local				++j;
*2f083884Ss.makeev_local			}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local			// advance
*2f083884Ss.makeev_local			part0 += m_points_weights[i];
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// stop if we didn't improve in this iteration
*2f083884Ss.makeev_local		if( bestiteration != iterationIndex )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// advance if possible
*2f083884Ss.makeev_local		++iterationIndex;
*2f083884Ss.makeev_local		if( iterationIndex == m_iterationCount )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// stop if a new iteration is an ordering that has already been tried
*2f083884Ss.makeev_local		Vec3 axis = ( bestend - beststart ).GetVec3();
*2f083884Ss.makeev_local		if( !ConstructOrdering( axis, iterationIndex ) )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// save the block if necessary
*2f083884Ss.makeev_local	if( CompareAnyLessThan( besterror, m_besterror ) )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// remap the indices
*2f083884Ss.makeev_local		u8 const* order = ( u8* )m_order + 16*bestiteration;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		u8 unordered[16];
*2f083884Ss.makeev_local		for( int m = 0; m < besti; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 0;
*2f083884Ss.makeev_local		for( int m = besti; m < bestj; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 2;
*2f083884Ss.makeev_local		for( int m = bestj; m < count; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 1;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		m_colours->RemapIndices( unordered, bestindices );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// save the block
*2f083884Ss.makeev_local		WriteColourBlock3( beststart.GetVec3(), bestend.GetVec3(), bestindices, block );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// save the error
*2f083884Ss.makeev_local		m_besterror = besterror;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_localvoid ClusterFit::Compress4( void* block )
*2f083884Ss.makeev_local{
*2f083884Ss.makeev_local	// declare variables
*2f083884Ss.makeev_local	int const count = m_colours->GetCount();
*2f083884Ss.makeev_local	Vec4 const two = VEC4_CONST( 2.0f );
*2f083884Ss.makeev_local	Vec4 const one = VEC4_CONST( 1.0f );
*2f083884Ss.makeev_local	Vec4 const onethird_onethird2( 1.0f/3.0f, 1.0f/3.0f, 1.0f/3.0f, 1.0f/9.0f );
*2f083884Ss.makeev_local	Vec4 const twothirds_twothirds2( 2.0f/3.0f, 2.0f/3.0f, 2.0f/3.0f, 4.0f/9.0f );
*2f083884Ss.makeev_local	Vec4 const twonineths = VEC4_CONST( 2.0f/9.0f );
*2f083884Ss.makeev_local	Vec4 const zero = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 const half = VEC4_CONST( 0.5f );
*2f083884Ss.makeev_local	Vec4 const grid( 31.0f, 63.0f, 31.0f, 0.0f );
*2f083884Ss.makeev_local	Vec4 const gridrcp( 1.0f/31.0f, 1.0f/63.0f, 1.0f/31.0f, 0.0f );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// prepare an ordering using the principle axis
*2f083884Ss.makeev_local	ConstructOrdering( m_principle, 0 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// check all possible clusters and iterate on the total order
*2f083884Ss.makeev_local	Vec4 beststart = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 bestend = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local	Vec4 besterror = m_besterror;
*2f083884Ss.makeev_local	u8 bestindices[16];
*2f083884Ss.makeev_local	int bestiteration = 0;
*2f083884Ss.makeev_local	int besti = 0, bestj = 0, bestk = 0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// loop over iterations (we avoid the case that all points in first or last cluster)
*2f083884Ss.makeev_local	for( int iterationIndex = 0;; )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// first cluster [0,i) is at the start
*2f083884Ss.makeev_local		Vec4 part0 = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local		for( int i = 0; i < count; ++i )
*2f083884Ss.makeev_local		{
*2f083884Ss.makeev_local			// second cluster [i,j) is one third along
*2f083884Ss.makeev_local			Vec4 part1 = VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local			for( int j = i;; )
*2f083884Ss.makeev_local			{
*2f083884Ss.makeev_local				// third cluster [j,k) is two thirds along
*2f083884Ss.makeev_local				Vec4 part2 = ( j == 0 ) ? m_points_weights[0] : VEC4_CONST( 0.0f );
*2f083884Ss.makeev_local				int kmin = ( j == 0 ) ? 1 : j;
*2f083884Ss.makeev_local				for( int k = kmin;; )
*2f083884Ss.makeev_local				{
*2f083884Ss.makeev_local					// last cluster [k,count) is at the end
*2f083884Ss.makeev_local					Vec4 part3 = m_xsum_wsum - part2 - part1 - part0;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// compute least squares terms directly
*2f083884Ss.makeev_local					Vec4 const alphax_sum = MultiplyAdd( part2, onethird_onethird2, MultiplyAdd( part1, twothirds_twothirds2, part0 ) );
*2f083884Ss.makeev_local					Vec4 const alpha2_sum = alphax_sum.SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					Vec4 const betax_sum = MultiplyAdd( part1, onethird_onethird2, MultiplyAdd( part2, twothirds_twothirds2, part3 ) );
*2f083884Ss.makeev_local					Vec4 const beta2_sum = betax_sum.SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					Vec4 const alphabeta_sum = twonineths*( part1 + part2 ).SplatW();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// compute the least-squares optimal points
*2f083884Ss.makeev_local					Vec4 factor = Reciprocal( NegativeMultiplySubtract( alphabeta_sum, alphabeta_sum, alpha2_sum*beta2_sum ) );
*2f083884Ss.makeev_local					Vec4 a = NegativeMultiplySubtract( betax_sum, alphabeta_sum, alphax_sum*beta2_sum )*factor;
*2f083884Ss.makeev_local					Vec4 b = NegativeMultiplySubtract( alphax_sum, alphabeta_sum, betax_sum*alpha2_sum )*factor;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// clamp to the grid
*2f083884Ss.makeev_local					a = Min( one, Max( zero, a ) );
*2f083884Ss.makeev_local					b = Min( one, Max( zero, b ) );
*2f083884Ss.makeev_local					a = Truncate( MultiplyAdd( grid, a, half ) )*gridrcp;
*2f083884Ss.makeev_local					b = Truncate( MultiplyAdd( grid, b, half ) )*gridrcp;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// compute the error (we skip the constant xxsum)
*2f083884Ss.makeev_local					Vec4 e1 = MultiplyAdd( a*a, alpha2_sum, b*b*beta2_sum );
*2f083884Ss.makeev_local					Vec4 e2 = NegativeMultiplySubtract( a, alphax_sum, a*b*alphabeta_sum );
*2f083884Ss.makeev_local					Vec4 e3 = NegativeMultiplySubtract( b, betax_sum, e2 );
*2f083884Ss.makeev_local					Vec4 e4 = MultiplyAdd( two, e3, e1 );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// apply the metric to the error term
*2f083884Ss.makeev_local					Vec4 e5 = e4*m_metric;
*2f083884Ss.makeev_local					Vec4 error = e5.SplatX() + e5.SplatY() + e5.SplatZ();
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// keep the solution if it wins
*2f083884Ss.makeev_local					if( CompareAnyLessThan( error, besterror ) )
*2f083884Ss.makeev_local					{
*2f083884Ss.makeev_local						beststart = a;
*2f083884Ss.makeev_local						bestend = b;
*2f083884Ss.makeev_local						besterror = error;
*2f083884Ss.makeev_local						besti = i;
*2f083884Ss.makeev_local						bestj = j;
*2f083884Ss.makeev_local						bestk = k;
*2f083884Ss.makeev_local						bestiteration = iterationIndex;
*2f083884Ss.makeev_local					}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local					// advance
*2f083884Ss.makeev_local					if( k == count )
*2f083884Ss.makeev_local						break;
*2f083884Ss.makeev_local					part2 += m_points_weights[k];
*2f083884Ss.makeev_local					++k;
*2f083884Ss.makeev_local				}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local				// advance
*2f083884Ss.makeev_local				if( j == count )
*2f083884Ss.makeev_local					break;
*2f083884Ss.makeev_local				part1 += m_points_weights[j];
*2f083884Ss.makeev_local				++j;
*2f083884Ss.makeev_local			}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local			// advance
*2f083884Ss.makeev_local			part0 += m_points_weights[i];
*2f083884Ss.makeev_local		}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// stop if we didn't improve in this iteration
*2f083884Ss.makeev_local		if( bestiteration != iterationIndex )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// advance if possible
*2f083884Ss.makeev_local		++iterationIndex;
*2f083884Ss.makeev_local		if( iterationIndex == m_iterationCount )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// stop if a new iteration is an ordering that has already been tried
*2f083884Ss.makeev_local		Vec3 axis = ( bestend - beststart ).GetVec3();
*2f083884Ss.makeev_local		if( !ConstructOrdering( axis, iterationIndex ) )
*2f083884Ss.makeev_local			break;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local	// save the block if necessary
*2f083884Ss.makeev_local	if( CompareAnyLessThan( besterror, m_besterror ) )
*2f083884Ss.makeev_local	{
*2f083884Ss.makeev_local		// remap the indices
*2f083884Ss.makeev_local		u8 const* order = ( u8* )m_order + 16*bestiteration;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		u8 unordered[16];
*2f083884Ss.makeev_local		for( int m = 0; m < besti; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 0;
*2f083884Ss.makeev_local		for( int m = besti; m < bestj; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 2;
*2f083884Ss.makeev_local		for( int m = bestj; m < bestk; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 3;
*2f083884Ss.makeev_local		for( int m = bestk; m < count; ++m )
*2f083884Ss.makeev_local			unordered[order[m]] = 1;
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		m_colours->RemapIndices( unordered, bestindices );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// save the block
*2f083884Ss.makeev_local		WriteColourBlock4( beststart.GetVec3(), bestend.GetVec3(), bestindices, block );
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local		// save the error
*2f083884Ss.makeev_local		m_besterror = besterror;
*2f083884Ss.makeev_local	}
*2f083884Ss.makeev_local}
*2f083884Ss.makeev_local
*2f083884Ss.makeev_local} // namespace squish