DirectXTexCompress.cpp 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809
  1. //-------------------------------------------------------------------------------------
  2. // DirectXTexCompress.cpp
  3. //
  4. // DirectX Texture Library - Texture compression
  5. //
  6. // THIS CODE AND INFORMATION IS PROVIDED "AS IS" WITHOUT WARRANTY OF
  7. // ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING BUT NOT LIMITED TO
  8. // THE IMPLIED WARRANTIES OF MERCHANTABILITY AND/OR FITNESS FOR A
  9. // PARTICULAR PURPOSE.
  10. //
  11. // Copyright (c) Microsoft Corporation. All rights reserved.
  12. //
  13. // http://go.microsoft.com/fwlink/?LinkId=248926
  14. //-------------------------------------------------------------------------------------
  15. #include "directxtexp.h"
  16. #ifdef _OPENMP
  17. #include <omp.h>
  18. #pragma warning(disable : 4616 6993)
  19. #endif
  20. #include "bc.h"
  21. namespace DirectX
  22. {
  23. inline static DWORD _GetBCFlags( _In_ DWORD compress )
  24. {
  25. static_assert( TEX_COMPRESS_RGB_DITHER == BC_FLAGS_DITHER_RGB, "TEX_COMPRESS_* flags should match BC_FLAGS_*" );
  26. static_assert( TEX_COMPRESS_A_DITHER == BC_FLAGS_DITHER_A, "TEX_COMPRESS_* flags should match BC_FLAGS_*" );
  27. static_assert( TEX_COMPRESS_DITHER == (BC_FLAGS_DITHER_RGB | BC_FLAGS_DITHER_A), "TEX_COMPRESS_* flags should match BC_FLAGS_*" );
  28. static_assert( TEX_COMPRESS_UNIFORM == BC_FLAGS_UNIFORM, "TEX_COMPRESS_* flags should match BC_FLAGS_*" );
  29. return ( compress & (BC_FLAGS_DITHER_RGB|BC_FLAGS_DITHER_A|BC_FLAGS_UNIFORM) );
  30. }
  31. inline static DWORD _GetSRGBFlags( _In_ DWORD compress )
  32. {
  33. static_assert( TEX_COMPRESS_SRGB_IN == TEX_FILTER_SRGB_IN, "TEX_COMPRESS_SRGB* should match TEX_FILTER_SRGB*" );
  34. static_assert( TEX_COMPRESS_SRGB_OUT == TEX_FILTER_SRGB_OUT, "TEX_COMPRESS_SRGB* should match TEX_FILTER_SRGB*" );
  35. static_assert( TEX_COMPRESS_SRGB == TEX_FILTER_SRGB, "TEX_COMPRESS_SRGB* should match TEX_FILTER_SRGB*" );
  36. return ( compress & TEX_COMPRESS_SRGB );
  37. }
  38. inline static bool _DetermineEncoderSettings( _In_ DXGI_FORMAT format, _Out_ BC_ENCODE& pfEncode, _Out_ size_t& blocksize, _Out_ DWORD& cflags )
  39. {
  40. switch(format)
  41. {
  42. case DXGI_FORMAT_BC1_UNORM:
  43. case DXGI_FORMAT_BC1_UNORM_SRGB: pfEncode = nullptr; blocksize = 8; cflags = 0; break;
  44. case DXGI_FORMAT_BC2_UNORM:
  45. case DXGI_FORMAT_BC2_UNORM_SRGB: pfEncode = D3DXEncodeBC2; blocksize = 16; cflags = 0; break;
  46. case DXGI_FORMAT_BC3_UNORM:
  47. case DXGI_FORMAT_BC3_UNORM_SRGB: pfEncode = D3DXEncodeBC3; blocksize = 16; cflags = 0; break;
  48. case DXGI_FORMAT_BC4_UNORM: pfEncode = D3DXEncodeBC4U; blocksize = 8; cflags = TEX_FILTER_RGB_COPY_RED; break;
  49. case DXGI_FORMAT_BC4_SNORM: pfEncode = D3DXEncodeBC4S; blocksize = 8; cflags = TEX_FILTER_RGB_COPY_RED; break;
  50. case DXGI_FORMAT_BC5_UNORM: pfEncode = D3DXEncodeBC5U; blocksize = 16; cflags = TEX_FILTER_RGB_COPY_RED | TEX_FILTER_RGB_COPY_GREEN; break;
  51. case DXGI_FORMAT_BC5_SNORM: pfEncode = D3DXEncodeBC5S; blocksize = 16; cflags = TEX_FILTER_RGB_COPY_RED | TEX_FILTER_RGB_COPY_GREEN; break;
  52. case DXGI_FORMAT_BC6H_UF16: pfEncode = D3DXEncodeBC6HU; blocksize = 16; cflags = 0; break;
  53. case DXGI_FORMAT_BC6H_SF16: pfEncode = D3DXEncodeBC6HS; blocksize = 16; cflags = 0; break;
  54. case DXGI_FORMAT_BC7_UNORM:
  55. case DXGI_FORMAT_BC7_UNORM_SRGB: pfEncode = D3DXEncodeBC7; blocksize = 16; cflags = 0; break;
  56. default: pfEncode = nullptr; blocksize = 0; cflags = 0; return false;
  57. }
  58. return true;
  59. }
  60. //-------------------------------------------------------------------------------------
  61. static HRESULT _CompressBC( _In_ const Image& image, _In_ const Image& result, _In_ DWORD bcflags,
  62. _In_ DWORD srgb, _In_ float alphaRef )
  63. {
  64. if ( !image.pixels || !result.pixels )
  65. return E_POINTER;
  66. assert( image.width == result.width );
  67. assert( image.height == result.height );
  68. const DXGI_FORMAT format = image.format;
  69. size_t sbpp = BitsPerPixel( format );
  70. if ( !sbpp )
  71. return E_FAIL;
  72. if ( sbpp < 8 )
  73. {
  74. // We don't support compressing from monochrome (DXGI_FORMAT_R1_UNORM)
  75. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  76. }
  77. // Round to bytes
  78. sbpp = ( sbpp + 7 ) / 8;
  79. uint8_t *pDest = result.pixels;
  80. // Determine BC format encoder
  81. BC_ENCODE pfEncode;
  82. size_t blocksize;
  83. DWORD cflags;
  84. if ( !_DetermineEncoderSettings( result.format, pfEncode, blocksize, cflags ) )
  85. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  86. XMVECTOR temp[16];
  87. const uint8_t *pSrc = image.pixels;
  88. const size_t rowPitch = image.rowPitch;
  89. for( size_t h=0; h < image.height; h += 4 )
  90. {
  91. const uint8_t *sptr = pSrc;
  92. uint8_t* dptr = pDest;
  93. size_t ph = std::min<size_t>( 4, image.height - h );
  94. size_t w = 0;
  95. for( size_t count = 0; count < rowPitch; count += sbpp*4, w += 4 )
  96. {
  97. size_t pw = std::min<size_t>( 4, image.width - w );
  98. assert( pw > 0 && ph > 0 );
  99. if ( !_LoadScanline( &temp[0], pw, sptr, rowPitch, format ) )
  100. return E_FAIL;
  101. if ( ph > 1 )
  102. {
  103. if ( !_LoadScanline( &temp[4], pw, sptr + rowPitch, rowPitch, format ) )
  104. return E_FAIL;
  105. if ( ph > 2 )
  106. {
  107. if ( !_LoadScanline( &temp[8], pw, sptr + rowPitch*2, rowPitch, format ) )
  108. return E_FAIL;
  109. if ( ph > 3 )
  110. {
  111. if ( !_LoadScanline( &temp[12], pw, sptr + rowPitch*3, rowPitch, format ) )
  112. return E_FAIL;
  113. }
  114. }
  115. }
  116. if ( pw != 4 || ph != 4 )
  117. {
  118. // Replicate pixels for partial block
  119. static const size_t uSrc[] = { 0, 0, 0, 1 };
  120. if ( pw < 4 )
  121. {
  122. for( size_t t = 0; t < ph && t < 4; ++t )
  123. {
  124. for( size_t s = pw; s < 4; ++s )
  125. {
  126. #pragma prefast(suppress: 26000, "PREFAST false positive")
  127. temp[ (t << 2) | s ] = temp[ (t << 2) | uSrc[s] ];
  128. }
  129. }
  130. }
  131. if ( ph < 4 )
  132. {
  133. for( size_t t = ph; t < 4; ++t )
  134. {
  135. for( size_t s = 0; s < 4; ++s )
  136. {
  137. #pragma prefast(suppress: 26000, "PREFAST false positive")
  138. temp[ (t << 2) | s ] = temp[ (uSrc[t] << 2) | s ];
  139. }
  140. }
  141. }
  142. }
  143. _ConvertScanline( temp, 16, result.format, format, cflags | srgb );
  144. if ( pfEncode )
  145. pfEncode( dptr, temp, bcflags );
  146. else
  147. D3DXEncodeBC1( dptr, temp, alphaRef, bcflags );
  148. sptr += sbpp*4;
  149. dptr += blocksize;
  150. }
  151. pSrc += rowPitch*4;
  152. pDest += result.rowPitch;
  153. }
  154. return S_OK;
  155. }
  156. //-------------------------------------------------------------------------------------
  157. #ifdef _OPENMP
  158. static HRESULT _CompressBC_Parallel( _In_ const Image& image, _In_ const Image& result, _In_ DWORD bcflags,
  159. _In_ DWORD srgb, _In_ float alphaRef )
  160. {
  161. if ( !image.pixels || !result.pixels )
  162. return E_POINTER;
  163. assert( image.width == result.width );
  164. assert( image.height == result.height );
  165. const DXGI_FORMAT format = image.format;
  166. size_t sbpp = BitsPerPixel( format );
  167. if ( !sbpp )
  168. return E_FAIL;
  169. if ( sbpp < 8 )
  170. {
  171. // We don't support compressing from monochrome (DXGI_FORMAT_R1_UNORM)
  172. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  173. }
  174. // Round to bytes
  175. sbpp = ( sbpp + 7 ) / 8;
  176. // Determine BC format encoder
  177. BC_ENCODE pfEncode;
  178. size_t blocksize;
  179. DWORD cflags;
  180. if ( !_DetermineEncoderSettings( result.format, pfEncode, blocksize, cflags ) )
  181. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  182. // Refactored version of loop to support parallel independance
  183. const size_t nBlocks = std::max<size_t>(1, (image.width + 3) / 4 ) * std::max<size_t>(1, (image.height + 3) / 4 );
  184. bool fail = false;
  185. #pragma omp parallel for
  186. for( int nb=0; nb < static_cast<int>( nBlocks ); ++nb )
  187. {
  188. const size_t nbWidth = std::max<size_t>(1, (image.width + 3) / 4 );
  189. const size_t y = nb / nbWidth;
  190. const size_t x = nb - (y*nbWidth);
  191. assert( x < image.width && y < image.height );
  192. size_t rowPitch = image.rowPitch;
  193. const uint8_t *pSrc = image.pixels + (y*4*rowPitch) + (x*4*sbpp);
  194. uint8_t *pDest = result.pixels + (nb*blocksize);
  195. size_t ph = std::min<size_t>( 4, image.height - y );
  196. size_t pw = std::min<size_t>( 4, image.width - x );
  197. assert( pw > 0 && ph > 0 );
  198. XMVECTOR temp[16];
  199. if ( !_LoadScanline( &temp[0], pw, pSrc, rowPitch, format ) )
  200. fail = true;
  201. if ( ph > 1 )
  202. {
  203. if ( !_LoadScanline( &temp[4], pw, pSrc + rowPitch, rowPitch, format ) )
  204. fail = true;
  205. if ( ph > 2 )
  206. {
  207. if ( !_LoadScanline( &temp[8], pw, pSrc + rowPitch*2, rowPitch, format ) )
  208. fail = true;
  209. if ( ph > 3 )
  210. {
  211. if ( !_LoadScanline( &temp[12], pw, pSrc + rowPitch*3, rowPitch, format ) )
  212. fail = true;
  213. }
  214. }
  215. }
  216. if ( pw != 4 || ph != 4 )
  217. {
  218. // Replicate pixels for partial block
  219. static const size_t uSrc[] = { 0, 0, 0, 1 };
  220. if ( pw < 4 )
  221. {
  222. for( size_t t = 0; t < ph && t < 4; ++t )
  223. {
  224. for( size_t s = pw; s < 4; ++s )
  225. {
  226. temp[ (t << 2) | s ] = temp[ (t << 2) | uSrc[s] ];
  227. }
  228. }
  229. }
  230. if ( ph < 4 )
  231. {
  232. for( size_t t = ph; t < 4; ++t )
  233. {
  234. for( size_t s = 0; s < 4; ++s )
  235. {
  236. temp[ (t << 2) | s ] = temp[ (uSrc[t] << 2) | s ];
  237. }
  238. }
  239. }
  240. }
  241. _ConvertScanline( temp, 16, result.format, format, cflags | srgb );
  242. if ( pfEncode )
  243. pfEncode( pDest, temp, bcflags );
  244. else
  245. D3DXEncodeBC1( pDest, temp, alphaRef, bcflags );
  246. }
  247. return (fail) ? E_FAIL : S_OK;
  248. }
  249. #endif // _OPENMP
  250. //-------------------------------------------------------------------------------------
  251. static DXGI_FORMAT _DefaultDecompress( _In_ DXGI_FORMAT format )
  252. {
  253. switch( format )
  254. {
  255. case DXGI_FORMAT_BC1_TYPELESS:
  256. case DXGI_FORMAT_BC1_UNORM:
  257. case DXGI_FORMAT_BC2_TYPELESS:
  258. case DXGI_FORMAT_BC2_UNORM:
  259. case DXGI_FORMAT_BC3_TYPELESS:
  260. case DXGI_FORMAT_BC3_UNORM:
  261. case DXGI_FORMAT_BC7_TYPELESS:
  262. case DXGI_FORMAT_BC7_UNORM:
  263. return DXGI_FORMAT_R8G8B8A8_UNORM;
  264. case DXGI_FORMAT_BC1_UNORM_SRGB:
  265. case DXGI_FORMAT_BC2_UNORM_SRGB:
  266. case DXGI_FORMAT_BC3_UNORM_SRGB:
  267. case DXGI_FORMAT_BC7_UNORM_SRGB:
  268. return DXGI_FORMAT_R8G8B8A8_UNORM_SRGB;
  269. case DXGI_FORMAT_BC4_TYPELESS:
  270. case DXGI_FORMAT_BC4_UNORM:
  271. return DXGI_FORMAT_R8_UNORM;
  272. case DXGI_FORMAT_BC4_SNORM:
  273. return DXGI_FORMAT_R8_SNORM;
  274. case DXGI_FORMAT_BC5_TYPELESS:
  275. case DXGI_FORMAT_BC5_UNORM:
  276. return DXGI_FORMAT_R8G8_UNORM;
  277. case DXGI_FORMAT_BC5_SNORM:
  278. return DXGI_FORMAT_R8G8_SNORM;
  279. case DXGI_FORMAT_BC6H_TYPELESS:
  280. case DXGI_FORMAT_BC6H_UF16:
  281. case DXGI_FORMAT_BC6H_SF16:
  282. // We could use DXGI_FORMAT_R32G32B32_FLOAT here since BC6H is always Alpha 1.0,
  283. // but this format is more supported by viewers
  284. return DXGI_FORMAT_R32G32B32A32_FLOAT;
  285. default:
  286. return DXGI_FORMAT_UNKNOWN;
  287. }
  288. }
  289. //-------------------------------------------------------------------------------------
  290. static HRESULT _DecompressBC( _In_ const Image& cImage, _In_ const Image& result )
  291. {
  292. if ( !cImage.pixels || !result.pixels )
  293. return E_POINTER;
  294. assert( cImage.width == result.width );
  295. assert( cImage.height == result.height );
  296. const DXGI_FORMAT format = result.format;
  297. size_t dbpp = BitsPerPixel( format );
  298. if ( !dbpp )
  299. return E_FAIL;
  300. if ( dbpp < 8 )
  301. {
  302. // We don't support decompressing to monochrome (DXGI_FORMAT_R1_UNORM)
  303. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  304. }
  305. // Round to bytes
  306. dbpp = ( dbpp + 7 ) / 8;
  307. uint8_t *pDest = result.pixels;
  308. if ( !pDest )
  309. return E_POINTER;
  310. // Promote "typeless" BC formats
  311. DXGI_FORMAT cformat;
  312. switch( cImage.format )
  313. {
  314. case DXGI_FORMAT_BC1_TYPELESS: cformat = DXGI_FORMAT_BC1_UNORM; break;
  315. case DXGI_FORMAT_BC2_TYPELESS: cformat = DXGI_FORMAT_BC2_UNORM; break;
  316. case DXGI_FORMAT_BC3_TYPELESS: cformat = DXGI_FORMAT_BC3_UNORM; break;
  317. case DXGI_FORMAT_BC4_TYPELESS: cformat = DXGI_FORMAT_BC4_UNORM; break;
  318. case DXGI_FORMAT_BC5_TYPELESS: cformat = DXGI_FORMAT_BC5_UNORM; break;
  319. case DXGI_FORMAT_BC6H_TYPELESS: cformat = DXGI_FORMAT_BC6H_UF16; break;
  320. case DXGI_FORMAT_BC7_TYPELESS: cformat = DXGI_FORMAT_BC7_UNORM; break;
  321. default: cformat = cImage.format; break;
  322. }
  323. // Determine BC format decoder
  324. BC_DECODE pfDecode;
  325. size_t sbpp;
  326. switch(cformat)
  327. {
  328. case DXGI_FORMAT_BC1_UNORM:
  329. case DXGI_FORMAT_BC1_UNORM_SRGB: pfDecode = D3DXDecodeBC1; sbpp = 8; break;
  330. case DXGI_FORMAT_BC2_UNORM:
  331. case DXGI_FORMAT_BC2_UNORM_SRGB: pfDecode = D3DXDecodeBC2; sbpp = 16; break;
  332. case DXGI_FORMAT_BC3_UNORM:
  333. case DXGI_FORMAT_BC3_UNORM_SRGB: pfDecode = D3DXDecodeBC3; sbpp = 16; break;
  334. case DXGI_FORMAT_BC4_UNORM: pfDecode = D3DXDecodeBC4U; sbpp = 8; break;
  335. case DXGI_FORMAT_BC4_SNORM: pfDecode = D3DXDecodeBC4S; sbpp = 8; break;
  336. case DXGI_FORMAT_BC5_UNORM: pfDecode = D3DXDecodeBC5U; sbpp = 16; break;
  337. case DXGI_FORMAT_BC5_SNORM: pfDecode = D3DXDecodeBC5S; sbpp = 16; break;
  338. case DXGI_FORMAT_BC6H_UF16: pfDecode = D3DXDecodeBC6HU; sbpp = 16; break;
  339. case DXGI_FORMAT_BC6H_SF16: pfDecode = D3DXDecodeBC6HS; sbpp = 16; break;
  340. case DXGI_FORMAT_BC7_UNORM:
  341. case DXGI_FORMAT_BC7_UNORM_SRGB: pfDecode = D3DXDecodeBC7; sbpp = 16; break;
  342. default:
  343. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  344. }
  345. XMVECTOR temp[16];
  346. const uint8_t *pSrc = cImage.pixels;
  347. const size_t rowPitch = result.rowPitch;
  348. for( size_t h=0; h < cImage.height; h += 4 )
  349. {
  350. const uint8_t *sptr = pSrc;
  351. uint8_t* dptr = pDest;
  352. size_t ph = std::min<size_t>( 4, cImage.height - h );
  353. size_t w = 0;
  354. for( size_t count = 0; count < cImage.rowPitch; count += sbpp, w += 4 )
  355. {
  356. pfDecode( temp, sptr );
  357. _ConvertScanline( temp, 16, format, cformat, 0 );
  358. size_t pw = std::min<size_t>( 4, cImage.width - w );
  359. assert( pw > 0 && ph > 0 );
  360. if ( !_StoreScanline( dptr, rowPitch, format, &temp[0], pw ) )
  361. return E_FAIL;
  362. if ( ph > 1 )
  363. {
  364. if ( !_StoreScanline( dptr + rowPitch, rowPitch, format, &temp[4], pw ) )
  365. return E_FAIL;
  366. if ( ph > 2 )
  367. {
  368. if ( !_StoreScanline( dptr + rowPitch*2, rowPitch, format, &temp[8], pw ) )
  369. return E_FAIL;
  370. if ( ph > 3 )
  371. {
  372. if ( !_StoreScanline( dptr + rowPitch*3, rowPitch, format, &temp[12], pw ) )
  373. return E_FAIL;
  374. }
  375. }
  376. }
  377. sptr += sbpp;
  378. dptr += dbpp*4;
  379. }
  380. pSrc += cImage.rowPitch;
  381. pDest += rowPitch*4;
  382. }
  383. return S_OK;
  384. }
  385. //-------------------------------------------------------------------------------------
  386. bool _IsAlphaAllOpaqueBC( _In_ const Image& cImage )
  387. {
  388. if ( !cImage.pixels )
  389. return false;
  390. // Promote "typeless" BC formats
  391. DXGI_FORMAT cformat;
  392. switch( cImage.format )
  393. {
  394. case DXGI_FORMAT_BC1_TYPELESS: cformat = DXGI_FORMAT_BC1_UNORM; break;
  395. case DXGI_FORMAT_BC2_TYPELESS: cformat = DXGI_FORMAT_BC2_UNORM; break;
  396. case DXGI_FORMAT_BC3_TYPELESS: cformat = DXGI_FORMAT_BC3_UNORM; break;
  397. case DXGI_FORMAT_BC7_TYPELESS: cformat = DXGI_FORMAT_BC7_UNORM; break;
  398. default: cformat = cImage.format; break;
  399. }
  400. // Determine BC format decoder
  401. BC_DECODE pfDecode;
  402. size_t sbpp;
  403. switch(cformat)
  404. {
  405. case DXGI_FORMAT_BC1_UNORM:
  406. case DXGI_FORMAT_BC1_UNORM_SRGB: pfDecode = D3DXDecodeBC1; sbpp = 8; break;
  407. case DXGI_FORMAT_BC2_UNORM:
  408. case DXGI_FORMAT_BC2_UNORM_SRGB: pfDecode = D3DXDecodeBC2; sbpp = 16; break;
  409. case DXGI_FORMAT_BC3_UNORM:
  410. case DXGI_FORMAT_BC3_UNORM_SRGB: pfDecode = D3DXDecodeBC3; sbpp = 16; break;
  411. case DXGI_FORMAT_BC7_UNORM:
  412. case DXGI_FORMAT_BC7_UNORM_SRGB: pfDecode = D3DXDecodeBC7; sbpp = 16; break;
  413. default:
  414. // BC4, BC5, and BC6 don't have alpha channels
  415. return false;
  416. }
  417. // Scan blocks for non-opaque alpha
  418. static const XMVECTORF32 threshold = { 0.99f, 0.99f, 0.99f, 0.99f };
  419. XMVECTOR temp[16];
  420. const uint8_t *pPixels = cImage.pixels;
  421. for( size_t h = 0; h < cImage.height; h += 4 )
  422. {
  423. const uint8_t *ptr = pPixels;
  424. size_t ph = std::min<size_t>( 4, cImage.height - h );
  425. size_t w = 0;
  426. for( size_t count = 0; count < cImage.rowPitch; count += sbpp, w += 4 )
  427. {
  428. pfDecode( temp, ptr );
  429. size_t pw = std::min<size_t>( 4, cImage.width - w );
  430. assert( pw > 0 && ph > 0 );
  431. if ( pw == 4 && ph == 4 )
  432. {
  433. // Full blocks
  434. for( size_t j = 0; j < 16; ++j )
  435. {
  436. XMVECTOR alpha = XMVectorSplatW( temp[j] );
  437. if ( XMVector4Less( alpha, threshold ) )
  438. return false;
  439. }
  440. }
  441. else
  442. {
  443. // Handle partial blocks
  444. for( size_t y = 0; y < ph; ++y )
  445. {
  446. for( size_t x = 0; x < pw; ++x )
  447. {
  448. XMVECTOR alpha = XMVectorSplatW( temp[ y * 4 + x ] );
  449. if ( XMVector4Less( alpha, threshold ) )
  450. return false;
  451. }
  452. }
  453. }
  454. ptr += sbpp;
  455. }
  456. pPixels += cImage.rowPitch;
  457. }
  458. return true;
  459. }
  460. //=====================================================================================
  461. // Entry-points
  462. //=====================================================================================
  463. //-------------------------------------------------------------------------------------
  464. // Compression
  465. //-------------------------------------------------------------------------------------
  466. _Use_decl_annotations_
  467. HRESULT Compress( const Image& srcImage, DXGI_FORMAT format, DWORD compress, float alphaRef, ScratchImage& image )
  468. {
  469. if ( IsCompressed(srcImage.format) || !IsCompressed(format) )
  470. return E_INVALIDARG;
  471. if ( IsTypeless(format)
  472. || IsTypeless(srcImage.format) || IsPlanar(srcImage.format) || IsPalettized(srcImage.format) )
  473. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  474. // Create compressed image
  475. HRESULT hr = image.Initialize2D( format, srcImage.width, srcImage.height, 1, 1 );
  476. if ( FAILED(hr) )
  477. return hr;
  478. const Image *img = image.GetImage( 0, 0, 0 );
  479. if ( !img )
  480. {
  481. image.Release();
  482. return E_POINTER;
  483. }
  484. // Compress single image
  485. if (compress & TEX_COMPRESS_PARALLEL)
  486. {
  487. #ifndef _OPENMP
  488. return E_NOTIMPL;
  489. #else
  490. hr = _CompressBC_Parallel( srcImage, *img, _GetBCFlags( compress ), _GetSRGBFlags( compress ), alphaRef );
  491. #endif // _OPENMP
  492. }
  493. else
  494. {
  495. hr = _CompressBC( srcImage, *img, _GetBCFlags( compress ), _GetSRGBFlags( compress ), alphaRef );
  496. }
  497. if ( FAILED(hr) )
  498. image.Release();
  499. return hr;
  500. }
  501. _Use_decl_annotations_
  502. HRESULT Compress( const Image* srcImages, size_t nimages, const TexMetadata& metadata,
  503. DXGI_FORMAT format, DWORD compress, float alphaRef, ScratchImage& cImages )
  504. {
  505. if ( !srcImages || !nimages )
  506. return E_INVALIDARG;
  507. if ( IsCompressed(metadata.format) || !IsCompressed(format) )
  508. return E_INVALIDARG;
  509. if ( IsTypeless(format)
  510. || IsTypeless(metadata.format) || IsPlanar(metadata.format) || IsPalettized(metadata.format) )
  511. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  512. cImages.Release();
  513. TexMetadata mdata2 = metadata;
  514. mdata2.format = format;
  515. HRESULT hr = cImages.Initialize( mdata2 );
  516. if ( FAILED(hr) )
  517. return hr;
  518. if ( nimages != cImages.GetImageCount() )
  519. {
  520. cImages.Release();
  521. return E_FAIL;
  522. }
  523. const Image* dest = cImages.GetImages();
  524. if ( !dest )
  525. {
  526. cImages.Release();
  527. return E_POINTER;
  528. }
  529. for( size_t index=0; index < nimages; ++index )
  530. {
  531. assert( dest[ index ].format == format );
  532. const Image& src = srcImages[ index ];
  533. if ( src.width != dest[ index ].width || src.height != dest[ index ].height )
  534. {
  535. cImages.Release();
  536. return E_FAIL;
  537. }
  538. if ( (compress & TEX_COMPRESS_PARALLEL) )
  539. {
  540. #ifndef _OPENMP
  541. return E_NOTIMPL;
  542. #else
  543. if ( compress & TEX_COMPRESS_PARALLEL )
  544. {
  545. hr = _CompressBC_Parallel( src, dest[ index ], _GetBCFlags( compress ), _GetSRGBFlags( compress ), alphaRef );
  546. if ( FAILED(hr) )
  547. {
  548. cImages.Release();
  549. return hr;
  550. }
  551. }
  552. #endif // _OPENMP
  553. }
  554. else
  555. {
  556. hr = _CompressBC( src, dest[ index ], _GetBCFlags( compress ), _GetSRGBFlags( compress ), alphaRef );
  557. if ( FAILED(hr) )
  558. {
  559. cImages.Release();
  560. return hr;
  561. }
  562. }
  563. }
  564. return S_OK;
  565. }
  566. //-------------------------------------------------------------------------------------
  567. // Decompression
  568. //-------------------------------------------------------------------------------------
  569. _Use_decl_annotations_
  570. HRESULT Decompress( const Image& cImage, DXGI_FORMAT format, ScratchImage& image )
  571. {
  572. if ( !IsCompressed(cImage.format) || IsCompressed(format) )
  573. return E_INVALIDARG;
  574. if ( format == DXGI_FORMAT_UNKNOWN )
  575. {
  576. // Pick a default decompressed format based on BC input format
  577. format = _DefaultDecompress( cImage.format );
  578. if ( format == DXGI_FORMAT_UNKNOWN )
  579. {
  580. // Input is not a compressed format
  581. return E_INVALIDARG;
  582. }
  583. }
  584. else
  585. {
  586. if ( !IsValid(format) )
  587. return E_INVALIDARG;
  588. if ( IsTypeless(format) || IsPlanar(format) || IsPalettized(format) )
  589. return HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  590. }
  591. // Create decompressed image
  592. HRESULT hr = image.Initialize2D( format, cImage.width, cImage.height, 1, 1 );
  593. if ( FAILED(hr) )
  594. return hr;
  595. const Image *img = image.GetImage( 0, 0, 0 );
  596. if ( !img )
  597. {
  598. image.Release();
  599. return E_POINTER;
  600. }
  601. // Decompress single image
  602. hr = _DecompressBC( cImage, *img );
  603. if ( FAILED(hr) )
  604. image.Release();
  605. return hr;
  606. }
  607. _Use_decl_annotations_
  608. HRESULT Decompress( const Image* cImages, size_t nimages, const TexMetadata& metadata,
  609. DXGI_FORMAT format, ScratchImage& images )
  610. {
  611. if ( !cImages || !nimages )
  612. return E_INVALIDARG;
  613. if ( !IsCompressed(metadata.format) || IsCompressed(format) )
  614. return E_INVALIDARG;
  615. if ( format == DXGI_FORMAT_UNKNOWN )
  616. {
  617. // Pick a default decompressed format based on BC input format
  618. format = _DefaultDecompress( cImages[0].format );
  619. if ( format == DXGI_FORMAT_UNKNOWN )
  620. {
  621. // Input is not a compressed format
  622. return E_FAIL;
  623. }
  624. }
  625. else
  626. {
  627. if ( !IsValid(format) )
  628. return E_INVALIDARG;
  629. if ( IsTypeless(format) || IsPlanar(format) || IsPalettized(format) )
  630. HRESULT_FROM_WIN32( ERROR_NOT_SUPPORTED );
  631. }
  632. images.Release();
  633. TexMetadata mdata2 = metadata;
  634. mdata2.format = format;
  635. HRESULT hr = images.Initialize( mdata2 );
  636. if ( FAILED(hr) )
  637. return hr;
  638. if ( nimages != images.GetImageCount() )
  639. {
  640. images.Release();
  641. return E_FAIL;
  642. }
  643. const Image* dest = images.GetImages();
  644. if ( !dest )
  645. {
  646. images.Release();
  647. return E_POINTER;
  648. }
  649. for( size_t index=0; index < nimages; ++index )
  650. {
  651. assert( dest[ index ].format == format );
  652. const Image& src = cImages[ index ];
  653. if ( !IsCompressed( src.format ) )
  654. {
  655. images.Release();
  656. return E_FAIL;
  657. }
  658. if ( src.width != dest[ index ].width || src.height != dest[ index ].height )
  659. {
  660. images.Release();
  661. return E_FAIL;
  662. }
  663. hr = _DecompressBC( src, dest[ index ] );
  664. if ( FAILED(hr) )
  665. {
  666. images.Release();
  667. return hr;
  668. }
  669. }
  670. return S_OK;
  671. }
  672. }; // namespace