summaryrefslogtreecommitdiffstats
path: root/thirdparty/etcpak/ProcessRGB.cpp
diff options
context:
space:
mode:
authorBlueCube3310 <53150244+BlueCube3310@users.noreply.github.com>2024-02-05 18:53:35 +0100
committerBlueCube3310 <53150244+BlueCube3310@users.noreply.github.com>2024-02-05 18:53:35 +0100
commitbecf5b1d2343a8f675300bfbf398140549d641f6 (patch)
tree0a16dddf2add1f2bd92572ad41b60ba86989f29b /thirdparty/etcpak/ProcessRGB.cpp
parentd3352813ea44447bfbf135efdec23acc4d1d3f89 (diff)
downloadredot-engine-becf5b1d2343a8f675300bfbf398140549d641f6.tar.gz
[etcpak] Sync with upstream
Diffstat (limited to 'thirdparty/etcpak/ProcessRGB.cpp')
-rw-r--r--thirdparty/etcpak/ProcessRGB.cpp52
1 files changed, 29 insertions, 23 deletions
diff --git a/thirdparty/etcpak/ProcessRGB.cpp b/thirdparty/etcpak/ProcessRGB.cpp
index 0caa687bc6..e1487fa767 100644
--- a/thirdparty/etcpak/ProcessRGB.cpp
+++ b/thirdparty/etcpak/ProcessRGB.cpp
@@ -3266,16 +3266,21 @@ etcpak_force_inline static int16x8_t WidenMultiplier_EAC_NEON( int16x8_t multipl
#endif
+template<bool checkSolid = true>
static etcpak_force_inline uint64_t ProcessAlpha_ETC2( const uint8_t* src )
{
#if defined __SSE4_1__
- // Check solid
__m128i s = _mm_loadu_si128( (__m128i*)src );
- __m128i solidCmp = _mm_set1_epi8( src[0] );
- __m128i cmpRes = _mm_cmpeq_epi8( s, solidCmp );
- if( _mm_testc_si128( cmpRes, _mm_set1_epi32( -1 ) ) )
+
+ if( checkSolid )
{
- return src[0];
+ // Check solid
+ __m128i solidCmp = _mm_set1_epi8( src[0] );
+ __m128i cmpRes = _mm_cmpeq_epi8( s, solidCmp );
+ if( _mm_testc_si128( cmpRes, _mm_set1_epi32( -1 ) ) )
+ {
+ return src[0];
+ }
}
// Calculate min, max
@@ -3684,12 +3689,15 @@ static etcpak_force_inline uint64_t ProcessAlpha_ETC2( const uint8_t* src )
int srcMid;
uint8x16_t srcAlphaBlock = vld1q_u8( src );
{
- uint8_t ref = src[0];
- uint8x16_t a0 = vdupq_n_u8( ref );
- uint8x16_t r = vceqq_u8( srcAlphaBlock, a0 );
- int64x2_t m = vreinterpretq_s64_u8( r );
- if( m[0] == -1 && m[1] == -1 )
- return ref;
+ if( checkSolid )
+ {
+ uint8_t ref = src[0];
+ uint8x16_t a0 = vdupq_n_u8( ref );
+ uint8x16_t r = vceqq_u8( srcAlphaBlock, a0 );
+ int64x2_t m = vreinterpretq_s64_u8( r );
+ if( m[0] == -1 && m[1] == -1 )
+ return ref;
+ }
// srcRange
#ifdef __aarch64__
@@ -3759,6 +3767,7 @@ static etcpak_force_inline uint64_t ProcessAlpha_ETC2( const uint8_t* src )
#undef EAC_RECONSTRUCT_VALUE
#else
+ if( checkSolid )
{
bool solid = true;
const uint8_t* ptr = src + 1;
@@ -3849,7 +3858,6 @@ static etcpak_force_inline uint64_t ProcessAlpha_ETC2( const uint8_t* src )
#endif
}
-
void CompressEtc1Alpha( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t width )
{
int w = 0;
@@ -4176,14 +4184,13 @@ void CompressEtc2Rgba( const uint32_t* src, uint64_t* dst, uint32_t blocks, size
src += width * 3;
w = 0;
}
- *dst++ = ProcessAlpha_ETC2( alpha );
+ *dst++ = ProcessAlpha_ETC2<true>( alpha );
*dst++ = ProcessRGB_ETC2( (uint8_t*)rgba, useHeuristics );
}
while( --blocks );
}
-// -- GODOT start --
-void CompressEtc2R8( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t width )
+void CompressEacR( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t width )
{
int w = 0;
uint8_t r[4*4];
@@ -4239,12 +4246,12 @@ void CompressEtc2R8( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t
src += width * 3;
w = 0;
}
- *dst++ = ProcessAlpha_ETC2( r );
+ *dst++ = ProcessAlpha_ETC2<false>( r );
}
while( --blocks );
}
-void CompressEtc2RG8( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t width )
+void CompressEacRg( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_t width )
{
int w = 0;
uint8_t rg[4*4*2];
@@ -4300,15 +4307,15 @@ void CompressEtc2RG8( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_
src += width;
v = *src;
*ptrr++ = (v & 0xff0000) >> 16;
- *ptrg++ = (v & 0xff00) >> 8;
+ *ptrg++ = (v & 0xff00) >> 8;
src += width;
v = *src;
*ptrr++ = (v & 0xff0000) >> 16;
- *ptrg++ = (v & 0xff00) >> 8;
+ *ptrg++ = (v & 0xff00) >> 8;
src += width;
v = *src;
*ptrr++ = (v & 0xff0000) >> 16;
- *ptrg++ = (v & 0xff00) >> 8;
+ *ptrg++ = (v & 0xff00) >> 8;
src -= width * 3 - 1;
}
#endif
@@ -4317,9 +4324,8 @@ void CompressEtc2RG8( const uint32_t* src, uint64_t* dst, uint32_t blocks, size_
src += width * 3;
w = 0;
}
- *dst++ = ProcessAlpha_ETC2( rg );
- *dst++ = ProcessAlpha_ETC2( &rg[16] );
+ *dst++ = ProcessAlpha_ETC2<false>( rg );
+ *dst++ = ProcessAlpha_ETC2<false>( &rg[16] );
}
while( --blocks );
}
-// -- GODOT end --