// ConvectionKernels_ETC.h (8.4 KB)
  1. #pragma once
  2. #ifndef __CVTT_CONVECTIONKERNELS_ETC_H__
  3. #define __CVTT_CONVECTIONKERNELS_ETC_H__
  4. #include "ConvectionKernels.h"
  5. #include "ConvectionKernels_ParallelMath.h"
  6. namespace cvtt
  7. {
  8. struct Options;
  9. namespace Internal
  10. {
  11. class ETCComputer
  12. {
  13. public:
  14. static void CompressETC1Block(uint8_t *outputBuffer, const PixelBlockU8 *inputBlocks, ETC1CompressionData *compressionData, const Options &options);
  15. static void CompressETC2Block(uint8_t *outputBuffer, const PixelBlockU8 *inputBlocks, ETC2CompressionData *compressionData, const Options &options, bool punchthroughAlpha);
  16. static void CompressETC2AlphaBlock(uint8_t *outputBuffer, const PixelBlockU8 *inputBlocks, const Options &options);
  17. static void CompressEACBlock(uint8_t *outputBuffer, const PixelBlockScalarS16 *inputBlocks, bool isSigned, const Options &options);
  18. static ETC2CompressionData *AllocETC2Data(cvtt::Kernels::allocFunc_t allocFunc, void *context, const cvtt::Options &options);
  19. static void ReleaseETC2Data(ETC2CompressionData *compressionData, cvtt::Kernels::freeFunc_t freeFunc);
  20. static ETC1CompressionData *AllocETC1Data(cvtt::Kernels::allocFunc_t allocFunc, void *context);
  21. static void ReleaseETC1Data(ETC1CompressionData *compressionData, cvtt::Kernels::freeFunc_t freeFunc);
  22. private:
  23. typedef ParallelMath::Float MFloat;
  24. typedef ParallelMath::SInt16 MSInt16;
  25. typedef ParallelMath::UInt15 MUInt15;
  26. typedef ParallelMath::UInt16 MUInt16;
  27. typedef ParallelMath::SInt32 MSInt32;
  28. typedef ParallelMath::UInt31 MUInt31;
  29. struct DifferentialResolveStorage
  30. {
  31. static const unsigned int MaxAttemptsPerSector = 57 + 81 + 81 + 81 + 81 + 81 + 81 + 81;
  32. MUInt15 diffNumAttempts[2];
  33. MFloat diffErrors[2][MaxAttemptsPerSector];
  34. MUInt16 diffSelectors[2][MaxAttemptsPerSector];
  35. MUInt15 diffColors[2][MaxAttemptsPerSector];
  36. MUInt15 diffTables[2][MaxAttemptsPerSector];
  37. uint16_t attemptSortIndexes[2][MaxAttemptsPerSector];
  38. };
  39. struct HModeEval
  40. {
  41. MFloat errors[62][16];
  42. MUInt16 signBits[62];
  43. MUInt15 uniqueQuantizedColors[62];
  44. MUInt15 numUniqueColors[2];
  45. };
  46. struct ETC1CompressionDataInternal : public cvtt::ETC1CompressionData
  47. {
  48. explicit ETC1CompressionDataInternal(void *context)
  49. : m_context(context)
  50. {
  51. }
  52. DifferentialResolveStorage m_drs;
  53. void *m_context;
  54. };
  55. struct ETC2CompressionDataInternal : public cvtt::ETC2CompressionData
  56. {
  57. explicit ETC2CompressionDataInternal(void *context, const cvtt::Options &options);
  58. HModeEval m_h;
  59. DifferentialResolveStorage m_drs;
  60. void *m_context;
  61. float m_chromaSideAxis0[3];
  62. float m_chromaSideAxis1[3];
  63. };
  64. static MFloat ComputeErrorUniform(const MUInt15 pixelA[3], const MUInt15 pixelB[3]);
  65. static MFloat ComputeErrorWeighted(const MUInt15 reconstructed[3], const MFloat pixelB[3], const Options options);
  66. static MFloat ComputeErrorFakeBT709(const MUInt15 reconstructed[3], const MFloat pixelB[3]);
  67. static void TestHalfBlock(MFloat &outError, MUInt16 &outSelectors, MUInt15 quantizedPackedColor, const MUInt15 pixels[8][3], const MFloat preWeightedPixels[8][3], const MSInt16 modifiers[4], bool isDifferential, const Options &options);
  68. static void TestHalfBlockPunchthrough(MFloat &outError, MUInt16 &outSelectors, MUInt15 quantizedPackedColor, const MUInt15 pixels[8][3], const MFloat preWeightedPixels[8][3], const ParallelMath::Int16CompFlag isTransparent[8], const MUInt15 modifier, const Options &options);
  69. static void FindBestDifferentialCombination(int flip, int d, const ParallelMath::Int16CompFlag canIgnoreSector[2], ParallelMath::Int16CompFlag& bestIsThisMode, MFloat& bestTotalError, MUInt15& bestFlip, MUInt15& bestD, MUInt15 bestColors[2], MUInt16 bestSelectors[2], MUInt15 bestTables[2], DifferentialResolveStorage &drs);
  70. static ParallelMath::Int16CompFlag ETCDifferentialIsLegalForChannel(const MUInt15 &a, const MUInt15 &b);
  71. static ParallelMath::Int16CompFlag ETCDifferentialIsLegal(const MUInt15 &a, const MUInt15 &b);
  72. static bool ETCDifferentialIsLegalForChannelScalar(const uint16_t &a, const uint16_t &b);
  73. static bool ETCDifferentialIsLegalScalar(const uint16_t &a, const uint16_t &b);
  74. static void EncodeTMode(uint8_t *outputBuffer, MFloat &bestError, const ParallelMath::Int16CompFlag isIsolated[16], const MUInt15 pixels[16][3], const MFloat preWeightedPixels[16][3], const Options &options);
  75. static void EncodeHMode(uint8_t *outputBuffer, MFloat &bestError, const ParallelMath::Int16CompFlag groupings[16], const MUInt15 pixels[16][3], HModeEval &he, const MFloat preWeightedPixels[16][3], const Options &options);
  76. static void EncodeVirtualTModePunchthrough(uint8_t *outputBuffer, MFloat &bestError, const ParallelMath::Int16CompFlag isIsolated[16], const MUInt15 pixels[16][3], const MFloat preWeightedPixels[16][3], const ParallelMath::Int16CompFlag isTransparent[16], const ParallelMath::Int16CompFlag& anyTransparent, const ParallelMath::Int16CompFlag& allTransparent, const Options &options);
  77. static MUInt15 DecodePlanarCoeff(const MUInt15 &coeff, int ch);
  78. static void EncodePlanar(uint8_t *outputBuffer, MFloat &bestError, const MUInt15 pixels[16][3], const MFloat preWeightedPixels[16][3], const Options &options);
  79. static void CompressETC1BlockInternal(MFloat &bestTotalError, uint8_t *outputBuffer, const MUInt15 pixels[16][3], const MFloat preWeightedPixels[16][3], DifferentialResolveStorage& compressionData, const Options &options, bool punchthrough);
  80. static void CompressETC1PunchthroughBlockInternal(MFloat &bestTotalError, uint8_t *outputBuffer, const MUInt15 pixels[16][3], const MFloat preWeightedPixels[16][3], const ParallelMath::Int16CompFlag isTransparent[16], DifferentialResolveStorage& compressionData, const Options &options);
  81. static void CompressETC2AlphaBlockInternal(uint8_t *outputBuffer, const MUInt15 pixels[16], bool is11Bit, bool isSigned, const Options &options);
  82. static void ExtractBlocks(MUInt15 pixels[16][3], MFloat preWeightedPixels[16][3], const PixelBlockU8 *inputBlocks, const Options &options);
  83. static void ResolveHalfBlockFakeBT709RoundingAccurate(MUInt15 quantized[3], const MUInt15 sectorCumulative[3], bool isDifferential);
  84. static void ResolveHalfBlockFakeBT709RoundingFast(MUInt15 quantized[3], const MUInt15 sectorCumulative[3], bool isDifferential);
  85. static void ResolveTHFakeBT709Rounding(MUInt15 quantized[3], const MUInt15 target[3], const MUInt15 &granularity);
  86. static void ConvertToFakeBT709(MFloat yuv[3], const MUInt15 color[3]);
  87. static void ConvertToFakeBT709(MFloat yuv[3], const MFloat color[3]);
  88. static void ConvertToFakeBT709(MFloat yuv[3], const MFloat &r, const MFloat &g, const MFloat &b);
  89. static void ConvertFromFakeBT709(MFloat rgb[3], const MFloat yuv[3]);
  90. static void QuantizeETC2Alpha(int tableIndex, const MUInt15& value, const MUInt15& baseValue, const MUInt15& multiplier, bool is11Bit, bool isSigned, MUInt15& outIndexes, MUInt15& outQuantizedValues);
  91. static void EmitTModeBlock(uint8_t *outputBuffer, const ParallelMath::ScalarUInt16 lineColor[3], const ParallelMath::ScalarUInt16 isolatedColor[3], int32_t packedSelectors, ParallelMath::ScalarUInt16 table, bool opaque);
  92. static void EmitHModeBlock(uint8_t *outputBuffer, const ParallelMath::ScalarUInt16 blockColors[2], ParallelMath::ScalarUInt16 sectorBits, ParallelMath::ScalarUInt16 signBits, ParallelMath::ScalarUInt16 table, bool opaque);
  93. static void EmitETC1Block(uint8_t *outputBuffer, int blockBestFlip, int blockBestD, const int blockBestColors[2][3], const int blockBestTables[2], const ParallelMath::ScalarUInt16 blockBestSelectors[2], bool transparent);
  94. static const int g_flipTables[2][2][8];
  95. };
  96. }
  97. }
  98. #endif