// id-Software / DOOM-3-BFG
// Mirrored from https://github.com/id-Software/DOOM-3-BFG
							/*
===========================================================================

Doom 3 BFG Edition GPL Source Code
Copyright (C) 1993-2012 id Software LLC, a ZeniMax Media company. 

This file is part of the Doom 3 BFG Edition GPL Source Code ("Doom 3 BFG Edition Source Code").  

Doom 3 BFG Edition Source Code is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

Doom 3 BFG Edition Source Code is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Doom 3 BFG Edition Source Code.  If not, see <http://www.gnu.org/licenses/>.

In addition, the Doom 3 BFG Edition Source Code is also subject to certain additional terms. You should have received a copy of these additional terms immediately following the terms and conditions of the GNU General Public License which accompanied the Doom 3 BFG Edition Source Code.  If not, please request a copy in writing from id Software at the address below.

If you have questions concerning this license or the applicable additional terms, you may contact in writing id Software LLC, c/o ZeniMax Media Inc., Suite 120, Rockville, Maryland 20850 USA.

===========================================================================
*/
#ifndef __DXTCODEC_H__
#define __DXTCODEC_H__

/*
================================================================================================
Contains the DxtEncoder and DxtDecoder declarations.
================================================================================================
*/

/*
================================================
idDxtEncoder encodes Images in a number of DXT formats. Raw input Images are assumed to be in
4-byte RGBA format. Raw input NormalMaps are assumed to be in 4-byte tangent-space NxNyNz format.

The supported formats are:
	* DXT1 = colors in 4x4 block approximated by equidistant points on a line through 3D space
	* DXT2 = DXT3 + colors are pre-multiplied by alpha
	* DXT3 = DXT1 + explicit 4-bit alpha
	* DXT4 = DXT5 + colors are pre-multiplied by alpha
	* DXT5 = DXT1 + alpha values in 4x4 block approximated by equidistant points on line through alpha space
	* CTX1 = colors in a 4x4 block approximated by equidistant points on a line through 2D space
	* DXN1 = one DXT5 alpha block (aka DXT5A, or ATI1N)
	* DXN2 = two DXT5 alpha blocks (aka 3Dc, or ATI2N)
================================================
*/
class idDxtEncoder {
public:
			// Every data member is initialized (in declaration order) so that none of them holds an
			// indeterminate value before the first compression call. A plain 0 is used as the null
			// pointer constant so this header does not depend on NULL being defined.
			idDxtEncoder() : width( 0 ), height( 0 ), outData( 0 ), srcPadding( 0 ), dstPadding( 0 ) {}
			~idDxtEncoder() {}

	// Store the padding values used by the compressors; both default to 0.
	// NOTE(review): the unit and the exact place where the padding is applied are defined by the
	// implementations outside this header - confirm there before relying on them.
	void	SetSrcPadding( int pad ) { srcPadding = pad; }
	void	SetDstPadding( int pad ) { dstPadding = pad; }

	// NOTE: every entry point below that is marked "not implemented" has an inline body that
	// only executes assert( 0 ); it never touches inBuf or outBuf.

	// high quality DXT1 compression (no alpha), uses exhaustive search to find a line through color space and is very slow
	void	CompressImageDXT1HQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast DXT1 compression (no alpha), for real-time use at the cost of a little quality
	void	CompressImageDXT1Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT1Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT1Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height );

	// high quality DXT1 compression (with alpha), uses exhaustive search to find a line through color space and is very slow
	void	CompressImageDXT1AlphaHQ( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// fast DXT1 compression (with alpha), for real-time use at the cost of a little quality
	void	CompressImageDXT1AlphaFast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT1AlphaFast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT1AlphaFast_SSE2( const byte *inBuf, byte *outBuf, int width, int height );

	// high quality DXT5 compression, uses exhaustive search to find a line through color space and is generally
	// too slow to actually use for anything
	void	CompressImageDXT5HQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast DXT5 compression for real-time use at the cost of a little quality
	void	CompressImageDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT5Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXT5Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height );

	// high quality CTX1 compression, uses exhaustive search to find a line through 2D space and is very slow
	void	CompressImageCTX1HQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast CTX1 compression for real-time use
	void	CompressImageCTX1Fast( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }
	void	CompressImageCTX1Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }
	void	CompressImageCTX1Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// high quality DXN1 (aka DXT5A or ATI1N) compression, uses exhaustive search to find a line through color space and is very slow
	void	CompressImageDXN1HQ( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// fast single channel compression into DXN1 (aka DXT5A or ATI1N) format, for real-time use
	void	CompressImageDXN1Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXN1Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressImageDXN1Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// high quality YCoCg DXT5 compression, uses exhaustive search to find a line through color space and is very slow
	void	CompressYCoCgDXT5HQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast YCoCg DXT5 compression for real-time use (the input is expected to be in CoCg_Y format)
	void	CompressYCoCgDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressYCoCgDXT5Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressYCoCgDXT5Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height );

	// fast YCoCg-Alpha DXT5 compression for real-time use (the input is expected to be in CoCgAY format)
	void	CompressYCoCgAlphaDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height );

	// high quality YCoCg CTX1 + DXT5A compression, uses exhaustive search to find a line through 2D space and is very slow
	void	CompressYCoCgCTX1DXT5AHQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast YCoCg CTX1 + DXT5A compression for real-time use (the input is expected to be in CoCg_Y format)
	void	CompressYCoCgCTX1DXT5AFast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressYCoCgCTX1DXT5AFast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressYCoCgCTX1DXT5AFast_SSE2( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// high quality tangent space NxNyNz normal map compression into DXT1 format (Nz is not used)
	void	CompressNormalMapDXT1HQ( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXT1RenormalizeHQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast tangent space NxNyNz normal map compression into DXT1 format (Nz is not used), for real-time use
	void	CompressNormalMapDXT1Fast( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }
	void	CompressNormalMapDXT1Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }
	void	CompressNormalMapDXT1Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// high quality tangent space _Ny_Nx normal map compression into DXT5 format
	void	CompressNormalMapDXT5HQ( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXT5RenormalizeHQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast tangent space _Ny_Nx normal map compression into DXT5 format, for real-time use
	void	CompressNormalMapDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXT5Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXT5Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height );

	// high quality tangent space NxNy_ normal map compression into DXN2 (3Dc, ATI2N) format
	void	CompressNormalMapDXN2HQ( const byte *inBuf, byte *outBuf, int width, int height );

	// fast tangent space NxNy_ normal map compression into DXN2 (3Dc, ATI2N) format, for real-time use
	void	CompressNormalMapDXN2Fast( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXN2Fast_Generic( const byte *inBuf, byte *outBuf, int width, int height );
	void	CompressNormalMapDXN2Fast_SSE2( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// fast single channel conversion from DXN1 (aka DXT5A or ATI1N) to DXT1, reasonably fast (also works in-place)
	void	ConvertImageDXN1_DXT1( const byte *inBuf, byte *outBuf, int width, int height );

	// fast single channel conversion from DXT1 to DXN1 (aka DXT5A or ATI1N), reasonably fast (also works in-place)
	void	ConvertImageDXT1_DXN1( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// fast tangent space NxNyNz normal map conversion from DXN (3Dc, ATI2N) to DXT5, reasonably fast (also works in-place)
	void	ConvertNormalMapDXN2_DXT5( const byte *inBuf, byte *outBuf, int width, int height );

	// fast tangent space NxNyNz normal map conversion DXT5 to DXN (3Dc, ATI2N), reasonably fast (also works in-place)
	void	ConvertNormalMapDXT5_DXN2( const byte *inBuf, byte *outBuf, int width, int height );

private:
	// Encoder state. All of it is zeroed by the constructor.
	// NOTE(review): width/height are presumably set by each Compress*/Convert* call - confirm in the implementation.
	int					width;
	int					height;
	byte *				outData;		// output cursor, advanced by EmitByte / EmitUShort / EmitUInt
	int					srcPadding;		// set through SetSrcPadding
	int					dstPadding;		// set through SetDstPadding

	// output helpers: store a value at outData and advance the cursor by the value's size
	void				EmitByte( byte b );
	void				EmitUShort( unsigned short s );
	void				EmitUInt( unsigned int i );

	// squared-difference metrics
	unsigned int		AlphaDistance( const byte a1, const byte a2 ) const;
	unsigned int		ColorDistance( const byte *c1, const byte *c2 ) const;
	unsigned int		ColorDistanceWeighted( const byte *c1, const byte *c2 ) const;
	unsigned int		CTX1Distance( const byte *c1, const byte *c2 ) const;

	// conversions between 8-bit channels and packed 5:6:5 colors
	unsigned short		ColorTo565( const byte *color ) const;
	unsigned short		ColorTo565( byte r, byte g, byte b ) const;
	void				ColorFrom565( unsigned short c565, byte *color ) const;
	byte				GreenFrom565( unsigned short c565 ) const;

	void				NV4XHardwareBugFix( byte *minColor, byte *maxColor ) const;

	bool				HasConstantValuePer4x4Block( const byte *inBuf, int width, int height, int channel ) const;
	void				WriteTinyColorDXT1( const byte *inBuf, int width, int height );
	void				WriteTinyColorDXT5( const byte *inBuf, int width, int height );
	void				WriteTinyColorCTX1DXT5A( const byte *inBuf, int width, int height );
	void				WriteTinyNormalMapDXT5( const byte *NxNy, int width, int height );
	void				WriteTinyNormalMapDXN( const byte *NxNy, int width, int height );
	void				WriteTinyDXT5A( const byte *NxNy, int width, int height );

	// helpers declared for the high quality (HQ) compressors; defined outside this header
	void				GetMinMaxColorsMaxDist( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				GetMinMaxColorsLuminance( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	int					GetSquareAlphaError( const byte *colorBlock, const int alphaOffset, const byte minAlpha, const byte maxAlpha, int lastError ) const;
	int					GetMinMaxAlphaHQ( const byte *colorBlock, const int alphaOffset, byte *minColor, byte *maxColor ) const;
	int					GetSquareColorsError( const byte *colorBlock, const unsigned short color0, const unsigned short color1, int lastError ) const;
	int					GetMinMaxColorsHQ( const byte *colorBlock, byte *minColor, byte *maxColor, bool noBlack ) const;
	int					GetSquareCTX1Error( const byte *colorBlock, const byte *color0, const byte *color1, int lastError ) const;
	int					GetMinMaxCTX1HQ( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	int					GetSquareNormalYError( const byte *colorBlock, const unsigned short color0, const unsigned short color1, int lastError, int scale ) const;
	int					GetMinMaxNormalYHQ( const byte *colorBlock, byte *minColor, byte *maxColor, bool noBlack, int scale ) const;
	int					GetSquareNormalsDXT1Error( const int *colorBlock, const unsigned short color0, const unsigned short color1, int lastError, unsigned int &colorIndices ) const;
	int					GetMinMaxNormalsDXT1HQ( const byte *colorBlock, byte *minColor, byte *maxColor, unsigned int &colorIndices, bool noBlack ) const;
	int					GetSquareNormalsDXT5Error( const int *normalBlock, const byte *minNormal, const byte *maxNormal, int lastError, unsigned int &colorIndices, byte *alphaIndices ) const;
	int					GetMinMaxNormalsDXT5HQ( const byte *normalBlock, byte *minColor, byte *maxColor, unsigned int &colorIndices, byte *alphaIndices ) const;
	int					GetMinMaxNormalsDXT5HQFast( const byte *normalBlock, byte *minColor, byte *maxColor, unsigned int &colorIndices, byte *alphaIndices ) const;
	void				ScaleYCoCg( byte *colorBlock ) const;
	void				BiasScaleNormalY( byte *colorBlock ) const;
	void				RotateNormalsDXT1( byte *block ) const;
	void				RotateNormalsDXT5( byte *block ) const;
	int					FindColorIndices( const byte *colorBlock, const unsigned short color0, const unsigned short color1, unsigned int &result ) const;
	int					FindAlphaIndices( const byte *colorBlock, const int alphaOffset, const byte alpha0, const byte alpha1, byte *indexes ) const;
	int					FindCTX1Indices( const byte *colorBlock, const byte *color0, const byte *color1, unsigned int &result ) const;

	// per-block helpers; each one listed again below with an _SSE2 suffix has a separate SSE2 variant
	void				ExtractBlock( const byte *inPtr, int width, byte *colorBlock ) const;
	void				GetMinMaxBBox( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				InsetColorsBBox( byte *minColor, byte *maxColor ) const;
	void				SelectColorsDiagonal( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				ScaleYCoCg( byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				InsetYCoCgAlpaBBox( byte *minColor, byte *maxColor ) const;
	void				InsetYCoCgBBox( byte *minColor, byte *maxColor ) const;
	void				SelectYCoCgDiagonal( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				InsetNormalsBBoxDXT5( byte *minNormal, byte *maxNormal ) const;
	void				InsetNormalsBBox3Dc( byte *minNormal, byte *maxNormal ) const;
	void				EmitColorIndices( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitColorAlphaIndices( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitCTX1Indices( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitAlphaIndices( const byte *colorBlock, const int channel, const byte minAlpha, const byte maxAlpha );
	void				EmitGreenIndices( const byte *block, const int channel, const byte minGreen, const byte maxGreen );

	// Keeping the ASM versions to keep the performance of 32-bit debug builds reasonable.
	// The implementation using intrinsics is very slow in debug builds because registers are continuously spilled to memory.
	void				ExtractBlock_SSE2( const byte *inPtr, int width, byte *colorBlock ) const;
	void				GetMinMaxBBox_SSE2( const byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				InsetColorsBBox_SSE2( byte *minColor, byte *maxColor ) const;
	void				InsetNormalsBBoxDXT5_SSE2( byte *minNormal, byte *maxNormal ) const;
	void				EmitColorIndices_SSE2( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitColorAlphaIndices_SSE2( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitCoCgIndices_SSE2( const byte *colorBlock, const byte *minColor, const byte *maxColor );
	void				EmitAlphaIndices_SSE2( const byte *colorBlock, const int minAlpha, const int maxAlpha );
	void				EmitAlphaIndices_SSE2( const byte *colorBlock, const int channelBitOffset, const int minAlpha, const int maxAlpha );
	void				EmitGreenIndices_SSE2( const byte *block, const int channelBitOffset, const int minGreen, const int maxGreen );
	void				ScaleYCoCg_SSE2( byte *colorBlock, byte *minColor, byte *maxColor ) const;
	void				InsetYCoCgBBox_SSE2( byte *minColor, byte *maxColor ) const;
	void				SelectYCoCgDiagonal_SSE2( const byte *colorBlock, byte *minColor, byte *maxColor ) const;


	void				EmitNormalYIndices( const byte *normalBlock, const int offset, const byte minNormalY, const byte maxNormalY );
	void				EmitNormalYIndices_SSE2( const byte *normalBlock, const int offset, const byte minNormalY, const byte maxNormalY );

	// helpers declared for the Convert* entry points; defined outside this header
	void				DecodeDXNAlphaValues( const byte *inBuf, byte *values );
	void				EncodeDXNAlphaValues( byte *outBuf, const byte min, const byte max, const byte *values );

	void				DecodeNormalYValues( const byte *inBuf, byte &min, byte &max, byte *values );
	void				EncodeNormalRGBIndices( byte *outBuf, const byte min, const byte max, const byte *values );
};

/*
========================
idDxtEncoder::CompressImageDXT1Fast

Forwards all arguments unchanged to the SSE2 implementation when ID_WIN_X86_SSE2_INTRIN is
defined at compile time, and to the generic implementation otherwise.
========================
*/
ID_INLINE void idDxtEncoder::CompressImageDXT1Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
#if !defined( ID_WIN_X86_SSE2_INTRIN )
	// no SSE2 intrinsics available: use the portable code path
	this->CompressImageDXT1Fast_Generic( inBuf, outBuf, width, height );
#else
	this->CompressImageDXT1Fast_SSE2( inBuf, outBuf, width, height );
#endif
}

/*
========================
idDxtEncoder::CompressImageDXT1AlphaFast

Forwards all arguments unchanged to the SSE2 implementation when ID_WIN_X86_SSE2_INTRIN is
defined at compile time, and to the generic implementation otherwise.
========================
*/
ID_INLINE void idDxtEncoder::CompressImageDXT1AlphaFast( const byte *inBuf, byte *outBuf, int width, int height ) {
#if !defined( ID_WIN_X86_SSE2_INTRIN )
	// no SSE2 intrinsics available: use the portable code path
	this->CompressImageDXT1AlphaFast_Generic( inBuf, outBuf, width, height );
#else
	this->CompressImageDXT1AlphaFast_SSE2( inBuf, outBuf, width, height );
#endif
}

/*
========================
idDxtEncoder::CompressImageDXT5Fast

Forwards all arguments unchanged to the SSE2 implementation when ID_WIN_X86_SSE2_INTRIN is
defined at compile time, and to the generic implementation otherwise.
========================
*/
ID_INLINE void idDxtEncoder::CompressImageDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
#if !defined( ID_WIN_X86_SSE2_INTRIN )
	// no SSE2 intrinsics available: use the portable code path
	this->CompressImageDXT5Fast_Generic( inBuf, outBuf, width, height );
#else
	this->CompressImageDXT5Fast_SSE2( inBuf, outBuf, width, height );
#endif
}

/*
========================
idDxtEncoder::CompressImageDXN1Fast

Always forwards to the generic implementation; there is no compile-time SSE2 selection here.
========================
*/
ID_INLINE void idDxtEncoder::CompressImageDXN1Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
	this->CompressImageDXN1Fast_Generic( inBuf, outBuf, width, height );
}

/*
========================
idDxtEncoder::CompressYCoCgDXT5Fast

Forwards all arguments unchanged to the SSE2 implementation when ID_WIN_X86_SSE2_INTRIN is
defined at compile time, and to the generic implementation otherwise.
========================
*/
ID_INLINE void idDxtEncoder::CompressYCoCgDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
#if !defined( ID_WIN_X86_SSE2_INTRIN )
	// no SSE2 intrinsics available: use the portable code path
	this->CompressYCoCgDXT5Fast_Generic( inBuf, outBuf, width, height );
#else
	this->CompressYCoCgDXT5Fast_SSE2( inBuf, outBuf, width, height );
#endif
}

/*
========================
idDxtEncoder::CompressYCoCgCTX1DXT5AFast

Always forwards to the generic implementation; there is no compile-time SSE2 selection here.
========================
*/
ID_INLINE void idDxtEncoder::CompressYCoCgCTX1DXT5AFast( const byte *inBuf, byte *outBuf, int width, int height ) {
	this->CompressYCoCgCTX1DXT5AFast_Generic( inBuf, outBuf, width, height );
}

/*
========================
idDxtEncoder::CompressNormalMapDXT5Fast

Forwards all arguments unchanged to the SSE2 implementation when ID_WIN_X86_SSE2_INTRIN is
defined at compile time, and to the generic implementation otherwise.
========================
*/
ID_INLINE void idDxtEncoder::CompressNormalMapDXT5Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
#if !defined( ID_WIN_X86_SSE2_INTRIN )
	// no SSE2 intrinsics available: use the portable code path
	this->CompressNormalMapDXT5Fast_Generic( inBuf, outBuf, width, height );
#else
	this->CompressNormalMapDXT5Fast_SSE2( inBuf, outBuf, width, height );
#endif
}

/*
========================
idDxtEncoder::CompressNormalMapDXN2Fast

Always forwards to the generic implementation; there is no compile-time SSE2 selection here.
========================
*/
ID_INLINE void idDxtEncoder::CompressNormalMapDXN2Fast( const byte *inBuf, byte *outBuf, int width, int height ) {
	this->CompressNormalMapDXN2Fast_Generic( inBuf, outBuf, width, height );
}

/*
========================
idDxtEncoder::EmitByte

Stores one byte at the output cursor and moves the cursor past it.
========================
*/
ID_INLINE void idDxtEncoder::EmitByte( byte b ) {
	outData[ 0 ] = b;
	outData++;
}

/*
========================
idDxtEncoder::EmitUShort

Stores an unsigned short at the output cursor in the host's native byte order and moves the
cursor forward by 2 bytes.
========================
*/
ID_INLINE void idDxtEncoder::EmitUShort( unsigned short s ) {
	// NOTE(review): the store goes through a reinterpreted pointer, so it relies on the target
	// tolerating a possibly unaligned 16-bit write - confirm for any new platform.
	unsigned short * const dst = reinterpret_cast< unsigned short * >( outData );
	dst[ 0 ] = s;
	outData += 2;
}

/*
========================
idDxtEncoder::EmitUInt

Stores an unsigned int at the output cursor in the host's native byte order and moves the
cursor forward by 4 bytes.
========================
*/
ID_INLINE void idDxtEncoder::EmitUInt( unsigned int i ) {
	// NOTE(review): the store goes through a reinterpreted pointer, so it relies on the target
	// tolerating a possibly unaligned 32-bit write - confirm for any new platform.
	unsigned int * const dst = reinterpret_cast< unsigned int * >( outData );
	dst[ 0 ] = i;
	outData += 4;
}

/*
========================
idDxtEncoder::AlphaDistance

Returns the squared difference of the two alpha values.
========================
*/
ID_INLINE unsigned int idDxtEncoder::AlphaDistance( const byte a1, const byte a2 ) const {
	// subtract as int so the difference can be negative before squaring
	const int delta = (int)a1 - (int)a2;
	return delta * delta;
}

/*
========================
idDxtEncoder::ColorDistance

Returns the sum of the squared differences of the first three channels of c1 and c2.
Any further channel is ignored.
========================
*/
ID_INLINE unsigned int idDxtEncoder::ColorDistance( const byte *c1, const byte *c2 ) const {
	const int d0 = (int)c1[ 0 ] - (int)c2[ 0 ];
	const int d1 = (int)c1[ 1 ] - (int)c2[ 1 ];
	const int d2 = (int)c1[ 2 ] - (int)c2[ 2 ];
	return ( d0 * d0 ) + ( d1 * d1 ) + ( d2 * d2 );
}

/*
========================
idDxtEncoder::ColorDistanceWeighted

Returns a weighted squared distance between the first three channels of c1 and c2.
The weights of channel 0 and channel 2 depend on the mean of the two channel 0 values,
channel 1 always has a weight of 4.
========================
*/
ID_INLINE unsigned int idDxtEncoder::ColorDistanceWeighted( const byte *c1, const byte *c2 ) const {
	// http://www.compuphase.com/cmetric.htm
	const int meanRed = ( (int)c1[0] + (int)c2[0] ) / 2;

	const int deltaR = (int)c1[0] - (int)c2[0];
	const int deltaG = (int)c1[1] - (int)c2[1];
	const int deltaB = (int)c1[2] - (int)c2[2];

	// the channel 0 and channel 2 weights are in 8.8 fixed point, hence the shift by 8
	const int termR = ( ( 512 + meanRed ) * deltaR * deltaR ) >> 8;
	const int termG = 4 * deltaG * deltaG;
	const int termB = ( ( 767 - meanRed ) * deltaB * deltaB ) >> 8;

	return termR + termG + termB;
}

/*
========================
idDxtEncoder::CTX1Distance

Returns the sum of the squared differences of the first two channels of c1 and c2.
========================
*/
ID_INLINE unsigned int idDxtEncoder::CTX1Distance( const byte *c1, const byte *c2 ) const {
	const int d0 = (int)c1[ 0 ] - (int)c2[ 0 ];
	const int d1 = (int)c1[ 1 ] - (int)c2[ 1 ];
	return ( d0 * d0 ) + ( d1 * d1 );
}

/*
========================
idDxtEncoder::ColorTo565

Packs the first three channels of color into a 16-bit 5:6:5 value by truncation:
channel 0 goes to bits 11-15, channel 1 to bits 5-10 and channel 2 to bits 0-4.
========================
*/
ID_INLINE unsigned short idDxtEncoder::ColorTo565( const byte *color ) const {
	const int field0 = color[ 0 ] >> 3;	// keep the top 5 bits
	const int field1 = color[ 1 ] >> 2;	// keep the top 6 bits
	const int field2 = color[ 2 ] >> 3;	// keep the top 5 bits
	return (unsigned short)( ( field0 << 11 ) | ( field1 << 5 ) | field2 );
}

/*
========================
idDxtEncoder::ColorFrom565

Expands a packed 5:6:5 value into color[0], color[1] and color[2]. Each field is moved to the
top of its byte and the field's own most significant bits are copied into the vacated low
bits. No other element of color is written.
========================
*/
ID_INLINE void idDxtEncoder::ColorFrom565( unsigned short c565, byte *color ) const {
	const unsigned int packed = c565;

	// bits 11-15 -> upper 5 bits, low 3 bits filled from bits 13-15
	color[ 0 ] = byte( ( ( packed >> 8 ) & 0xF8 ) | ( ( packed >> 13 ) & 0x07 ) );
	// bits 5-10 -> upper 6 bits, low 2 bits filled from bits 9-10
	color[ 1 ] = byte( ( ( packed >> 3 ) & 0xFC ) | ( ( packed >> 9 ) & 0x03 ) );
	// bits 0-4 -> upper 5 bits, low 3 bits filled from bits 2-4
	color[ 2 ] = byte( ( ( packed << 3 ) & 0xF8 ) | ( ( packed >> 2 ) & 0x07 ) );
}

/*
========================
idDxtEncoder::ColorTo565

Packs r, g and b into a 16-bit 5:6:5 value by truncation:
r goes to bits 11-15, g to bits 5-10 and b to bits 0-4.
========================
*/
ID_INLINE unsigned short idDxtEncoder::ColorTo565( byte r, byte g, byte b ) const {
	const int red5 = r >> 3;
	const int green6 = g >> 2;
	const int blue5 = b >> 3;
	return (unsigned short)( ( red5 << 11 ) | ( green6 << 5 ) | blue5 );
}

/*
========================
idDxtEncoder::GreenFrom565

Extracts the 6-bit field stored in bits 5-10 of c565 and expands it to 8 bits by placing it in
the upper 6 bits and copying its two most significant bits into the low 2 bits.
========================
*/
ID_INLINE byte idDxtEncoder::GreenFrom565( unsigned short c565 ) const {
	// 0x07E0 selects bits 5-10; shifting right by 3 leaves the field in bits 2-7
	const byte upper = byte( ( c565 & 0x07E0 ) >> 3 );
	return byte( upper | ( upper >> 6 ) );
}

/*
================================================
idDxtDecoder decodes DXT-compressed Images. Raw output Images are in 
4-byte RGBA format. Raw output NormalMaps are in 4-byte tangent-space NxNyNz format.
================================================
*/
class idDxtDecoder {
public:	

	// All public entry points take the source buffer, one or more destination buffers and the image
	// dimensions. Entry points marked "not implemented" have an inline body that only executes assert( 0 ).

	// DXT1 decompression (no alpha)
	void	DecompressImageDXT1( const byte *inBuf, byte *outBuf, int width, int height );

	// DXT5 decompression
	void	DecompressImageDXT5( const byte *inBuf, byte *outBuf, int width, int height );

	// DXT5 decompression with nVidia 7x hardware bug
	void	DecompressImageDXT5_nVidia7x( const byte *inBuf, byte *outBuf, int width, int height );

	// CTX1
	void	DecompressImageCTX1( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// DXN1
	void	DecompressImageDXN1( const byte *inBuf, byte *outBuf, int width, int height ) { /* not implemented */ assert( 0 ); }

	// YCoCg DXT5 (the output is in CoCg_Y format)
	void	DecompressYCoCgDXT5( const byte *inBuf, byte *outBuf, int width, int height );

	// YCoCg CTX1 + DXT5A (the output is in CoCg_Y format)
	void	DecompressYCoCgCTX1DXT5A( const byte *inBuf, byte *outBuf, int width, int height );

	// tangent space normal map decompression from DXT1 format
	void	DecompressNormalMapDXT1( const byte *inBuf, byte *outBuf, int width, int height );
	void	DecompressNormalMapDXT1Renormalize( const byte *inBuf, byte *outBuf, int width, int height );

	// tangent space normal map decompression from DXT5 format
	void	DecompressNormalMapDXT5( const byte *inBuf, byte *outBuf, int width, int height );
	void	DecompressNormalMapDXT5Renormalize( const byte *inBuf, byte *outBuf, int width, int height );

	// tangent space normal map decompression from DXN2 format
	void	DecompressNormalMapDXN2( const byte *inBuf, byte *outBuf, int width, int height );

	// decompose a DXT image into indices and two images with colors
	void	DecomposeImageDXT1( const byte *inBuf, byte *colorIndices, byte *pic1, byte *pic2, int width, int height );
	void	DecomposeImageDXT5( const byte *inBuf, byte *colorIndices, byte *alphaIndices, byte *pic1, byte *pic2, int width, int height );

private:
	// Decoder state. No constructor is declared, so this class does not initialize these members.
	// NOTE(review): presumably each public entry point sets them before use - confirm in the implementation.
	int					width;
	int					height;
	const byte *		inData;		// input cursor, advanced by ReadByte / ReadUShort / ReadUInt

	// input helpers: load a value from inData and advance the cursor by the value's size
	byte				ReadByte();
	unsigned short		ReadUShort();
	unsigned int		ReadUInt();

	// conversions between 8-bit channels and packed 5:6:5 values
	unsigned short		ColorTo565( const byte *color ) const;
	void				ColorFrom565( unsigned short c565, byte *color ) const;
	unsigned short		NormalYTo565( byte y ) const;				// writes bits 5-10
	byte				NormalYFrom565( unsigned short c565 ) const;	// reads bits 5-10
	byte				NormalScaleFrom565( unsigned short c565 ) const;	// reads bits 0-4
	byte				NormalBiasFrom565( unsigned short c565 ) const;	// reads bits 11-15

	// block level helpers; defined outside this header
	void				EmitBlock( byte *outPtr, int x, int y, const byte *colorBlock );
	void				DecodeAlphaValues( byte *colorBlock, const int offset );
	void				DecodeColorValues( byte *colorBlock, bool noBlack, bool writeAlpha );
	void				DecodeCTX1Values( byte *colorBlock );

	void				DecomposeColorBlock( byte colors[2][4], byte colorIndices[16], bool noBlack );
	void				DecomposeAlphaBlock( byte colors[2][4], byte alphaIndices[16] );

	void				DecodeNormalYValues( byte *normalBlock, const int offsetY, byte &bias, byte &scale );
	void				DeriveNormalZValues( byte *normalBlock );
};

/*
========================
idDxtDecoder::ReadByte

Returns the byte at the input cursor and moves the cursor past it.
========================
*/
ID_INLINE byte idDxtDecoder::ReadByte() {
	const byte value = inData[ 0 ];
	inData++;
	return value;
}

/*
========================
idDxtDecoder::ReadUShort

Loads an unsigned short from the input cursor in the host's native byte order and moves the
cursor forward by 2 bytes.
========================
*/
ID_INLINE unsigned short idDxtDecoder::ReadUShort() {
	// NOTE(review): the load goes through a reinterpreted pointer, so it relies on the target
	// tolerating a possibly unaligned 16-bit read - confirm for any new platform.
	const unsigned short * const src = reinterpret_cast< const unsigned short * >( inData );
	const unsigned short value = src[ 0 ];
	inData += 2;
	return value;
}

/*
========================
idDxtDecoder::ReadUInt

Loads an unsigned int from the input cursor in the host's native byte order and moves the
cursor forward by 4 bytes.
========================
*/
ID_INLINE unsigned int idDxtDecoder::ReadUInt() {
	// NOTE(review): the load goes through a reinterpreted pointer, so it relies on the target
	// tolerating a possibly unaligned 32-bit read - confirm for any new platform.
	const unsigned int * const src = reinterpret_cast< const unsigned int * >( inData );
	const unsigned int value = src[ 0 ];
	inData += 4;
	return value;
}

/*
========================
idDxtDecoder::ColorTo565

Packs the first three channels of color into a 16-bit 5:6:5 value by truncation:
channel 0 goes to bits 11-15, channel 1 to bits 5-10 and channel 2 to bits 0-4.
========================
*/
ID_INLINE unsigned short idDxtDecoder::ColorTo565( const byte *color ) const {
	const int hi5 = color[ 0 ] >> 3;	// keep the top 5 bits
	const int mid6 = color[ 1 ] >> 2;	// keep the top 6 bits
	const int lo5 = color[ 2 ] >> 3;	// keep the top 5 bits
	return (unsigned short)( ( hi5 << 11 ) | ( mid6 << 5 ) | lo5 );
}

/*
========================
idDxtDecoder::ColorFrom565

Expands a packed 5:6:5 value into color[0], color[1] and color[2]. Each field is moved to the
top of its byte and the field's own most significant bits are copied into the vacated low
bits. No other element of color is written.
========================
*/
ID_INLINE void idDxtDecoder::ColorFrom565( unsigned short c565, byte *color ) const {
	const unsigned int bits = c565;

	// bits 11-15 -> upper 5 bits, low 3 bits filled from bits 13-15
	color[ 0 ] = byte( ( ( bits >> 8 ) & 0xF8 ) | ( ( bits >> 13 ) & 0x07 ) );
	// bits 5-10 -> upper 6 bits, low 2 bits filled from bits 9-10
	color[ 1 ] = byte( ( ( bits >> 3 ) & 0xFC ) | ( ( bits >> 9 ) & 0x03 ) );
	// bits 0-4 -> upper 5 bits, low 3 bits filled from bits 2-4
	color[ 2 ] = byte( ( ( bits << 3 ) & 0xF8 ) | ( ( bits >> 2 ) & 0x07 ) );
}

/*
========================
idDxtDecoder::NormalYTo565

Truncates y to its top 6 bits and places them in bits 5-10 of the result.
All other bits of the result are zero.
========================
*/
ID_INLINE unsigned short idDxtDecoder::NormalYTo565( byte y ) const {
	const int y6 = y >> 2;
	return (unsigned short)( y6 << 5 );
}

/*
========================
idDxtDecoder::NormalYFrom565

Extracts the 6-bit field stored in bits 5-10 of c565 and expands it to 8 bits by placing it in
the upper 6 bits and copying its two most significant bits into the low 2 bits.
========================
*/
ID_INLINE byte idDxtDecoder::NormalYFrom565( unsigned short c565 ) const {
	// 0x07E0 selects bits 5-10; shifting right by 3 leaves the field in bits 2-7
	const byte upper = byte( ( c565 & 0x07E0 ) >> 3 );
	return byte( upper | ( upper >> 6 ) );
}

/*
========================
idDxtDecoder::NormalBiasFrom565

Extracts the 5-bit field stored in bits 11-15 of c565 and expands it to 8 bits by placing it in
the upper 5 bits and copying its three most significant bits into the low 3 bits.
========================
*/
ID_INLINE byte idDxtDecoder::NormalBiasFrom565( unsigned short c565 ) const {
	// 0xF800 selects bits 11-15; shifting right by 8 leaves the field in bits 3-7
	const byte upper = byte( ( c565 & 0xF800 ) >> 8 );
	return byte( upper | ( upper >> 5 ) );
}

/*
========================
idDxtDecoder::NormalScaleFrom565

Extracts the 5-bit field stored in bits 0-4 of c565 and expands it to 8 bits by placing it in
the upper 5 bits and copying its three most significant bits into the low 3 bits.
========================
*/
ID_INLINE byte idDxtDecoder::NormalScaleFrom565( unsigned short c565 ) const {
	// 0x001F selects bits 0-4; shifting left by 3 moves the field to bits 3-7
	const byte upper = byte( ( c565 & 0x001F ) << 3 );
	return byte( upper | ( upper >> 5 ) );
}

#endif // !__DXTCODEC_H__