update

Kitsune44 · Kitsune44 · commit 1cc0264c6d27 · 2026-06-20T13:04:22.000+02:00
diff --git a/src/game/client/videoservices/video_ffmpeg.cpp b/src/game/client/videoservices/video_ffmpeg.cpp
@@ -441,10 +441,10 @@ void VideoFFmpegPlayer::PrintInfo( std::string &filePath ) noexcept {
 
     ConColorMsg( Color( 77, 166, 255, 150 ), "  Decoder:\n" );
     if ( decoder != nullptr ) {
-        ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:        %s (%s)\n", decoder->name ? decoder->name : "unknown", decoder->long_name ? decoder->long_name : "unknown" );
+        ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:         %s (%s)\n", decoder->name ? decoder->name : "unknown", decoder->long_name ? decoder->long_name : "unknown" );
     }
     else {
-        ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:        unknown\n" );
+        ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:         unknown\n" );
     }
     ConColorMsg( Color( 153, 204, 255, 150 ), "    Pixel Format:    %s\n", pixFmt ? pixFmt : "unknown" );
     ConColorMsg( Color( 153, 204, 255, 255 ), "    Color range:     %s\n", range_str ? range_str : "unknown" );
diff --git a/src/game/client/videoservices/video_material_simd.cpp b/src/game/client/videoservices/video_material_simd.cpp
@@ -46,15 +46,6 @@ VMSM_INLINE void VideoMaterialSIMD::RuntimeDispatch() noexcept
     else {
         m_memcpy_fn = memcpy_sse2;
     }
-
-    // Conversion function dispatch
-    /**/
-    if ( CPUHasAVX2() ) {
-        m_convert_u16_u8_rrs_fn = convert_u16_u8_rrs_avx2;
-    }
-    else {
-        m_convert_u16_u8_rrs_fn = convert_u16_u8_rrs_sse2;
-    }
 }
 
 // --------------------------------------------------------------------------------------------
@@ -63,7 +54,6 @@ VMSM_INLINE void VideoMaterialSIMD::RuntimeDispatch() noexcept
 // src - source buffer: AVFrame uint8_t/uint16_t, 32/64-byte aligned
 // --------------------------------------------------------------------------------------------
 
-
 #define MASK_64B 0x3F   // 6: 64-byte blocks (used with __m512i,  AVX-512 register = 512 bits)
 #define MASK_32B 0x1F   // 5: 32-byte blocks (used with __m256i, AVX/AVX2 register = 256 bits)
 #define MASK_16B  0xF   // 4: 16-byte blocks (used with __m128i, SSE/SSE2 register = 128 bits)
@@ -119,7 +109,7 @@ VMSM_INLINE void VideoMaterialSIMD::memcpy_sse2( uint8_t *VMSM_RESTRICT dst, uin
         mov edi, d
 
         align_loop :
-        movdqa xmm0, [ esi ]
+            movdqa xmm0, [ esi ]
             movdqa xmm1, [ esi + 16 ]
             movdqa xmm2, [ esi + 32 ]
             movdqa xmm3, [ esi + 48 ]
@@ -142,97 +132,6 @@ VMSM_INLINE void VideoMaterialSIMD::memcpy_sse2( uint8_t *VMSM_RESTRICT dst, uin
         memcpy( d, s, rem );
 }
 
-// --------------------------------------------------------------------------------------------
-// SIMD Convert U16 to U8 - Right Shift Implementations for Source Engine Video Materials
-// dst: Source Engine: IVTFTexture uint8_t, 1byte per pixel, 16-byte aligned 
-// src: FFmpeg: AVFrame uint16_t, 2byte per pixel, 32/64-byte aligned
-// --------------------------------------------------------------------------------------------
-
-//-----------------------------------------------------------------
-// SIMD Convert_U16_U8_RS: AVX2 STREAM Aligned(dst)-Unaligned(src)
-//-----------------------------------------------------------------
-
-VMSM_INLINE void VideoMaterialSIMD::convert_u16_u8_rrs_avx2(
-    uint8_t *VMSM_RESTRICT dst, const uint16_t *VMSM_RESTRICT src, size_t bts, int sft ) noexcept
-{
-    const int bs = 1 << ( sft - 1 );
-    const __m256i rnd = _mm256_set1_epi16( bs );
-
-    size_t bts2a = ( 64 - ( reinterpret_cast< uintptr_t >( dst ) & MASK_64B ) ) & MASK_64B;
-    if ( bts2a > 0 ) {
-        for ( size_t i = 0; i < bts2a; ++i ) {
-            dst[ i ] = static_cast< uint8_t >( ( src[ i ] + bs ) >> sft );
-        }
-        dst += bts2a;
-        src += bts2a;
-        bts -= bts2a;
-    }
-
-    const __m256i *s = reinterpret_cast< const __m256i * >( src );
-    __m256i *d = reinterpret_cast< __m256i * >( dst );
-
-    size_t blx = bts >> 6;
-    const size_t rem = bts & MASK_64B;
-
-    while ( blx-- )
-    {
-        __m256i v01 = _mm256_lddqu_si256( s++ );
-        __m256i v02 = _mm256_lddqu_si256( s++ );
-        __m256i v03 = _mm256_lddqu_si256( s++ );
-        __m256i v04 = _mm256_lddqu_si256( s++ );
-
-        v01 = _mm256_srli_epi16( _mm256_add_epi16( v01, rnd ), sft );
-        v02 = _mm256_srli_epi16( _mm256_add_epi16( v02, rnd ), sft );
-        v03 = _mm256_srli_epi16( _mm256_add_epi16( v03, rnd ), sft );
-        v04 = _mm256_srli_epi16( _mm256_add_epi16( v04, rnd ), sft );
-
-        _mm256_stream_si256( d++, _mm256_permute4x64_epi64( _mm256_packus_epi16( v01, v02 ), 0xD8 ) );
-        _mm256_stream_si256( d++, _mm256_permute4x64_epi64( _mm256_packus_epi16( v03, v04 ), 0xD8 ) );
-    }
-    _mm_sfence();
-    if ( rem > 0 ) {
-        for ( size_t i = 0; i < rem; ++i ) {
-            reinterpret_cast< uint8_t * >( d )[ i ] =
-                static_cast< uint8_t >( ( reinterpret_cast< const uint16_t * >( s )[ i ] + bs ) >> sft );
-        }
-    }
-}
-
-//-----------------------------------------------------------------
-// SIMD Convert_U16_U8_RS: SSE2 STREAM Aligned(dst)-Aligned(src)
-//-----------------------------------------------------------------
-
-VMSM_INLINE void VideoMaterialSIMD::convert_u16_u8_rrs_sse2(
-    uint8_t *VMSM_RESTRICT dst, const uint16_t *VMSM_RESTRICT src, size_t bts, int sft ) noexcept
-{
-    const int bs = 1 << ( sft - 1 );
-    const __m128i rnd = _mm_set1_epi16( bs );
-
-    const __m128i *s = reinterpret_cast< const __m128i * >( src );
-    __m128i *d = reinterpret_cast< __m128i * >( dst );
-
-    size_t blx = bts >> 4;
-    const size_t rem = bts & MASK_16B;
-
-    while ( blx-- )
-    {
-        __m128i v01 = _mm_load_si128( s++ );
-        __m128i v02 = _mm_load_si128( s++ );
-
-        v01 = _mm_srli_epi16( _mm_add_epi16( v01, rnd ), sft );
-        v02 = _mm_srli_epi16( _mm_add_epi16( v02, rnd ), sft );
-
-        _mm_stream_si128( d++, _mm_packus_epi16( v01, v02 ) );
-    }
-    _mm_sfence();
-    if ( rem > 0 ) {
-        for ( size_t i = 0; i < rem; ++i ) {
-            reinterpret_cast< uint8_t * >( d )[ i ] =
-                static_cast< uint8_t >( ( reinterpret_cast< const uint16_t * >( s )[ i ] + bs ) >> sft );
-        }
-    }
-}
-
 // --------------------------------------------------------------------------------------------
 // CPU Feature Detection
 // These functions check for the presence of specific SIMD instruction sets
diff --git a/src/game/client/videoservices/video_material_simd.h b/src/game/client/videoservices/video_material_simd.h
@@ -51,19 +51,6 @@ struct VideoMaterialSIMD final {
         m_memcpy_fn( dst, src, bts );
     }
 
-    /**
-     * @brief Convert uint16_t array to uint8_t with right shift
-     * @param dst - destination buffer: Valve Source Engine: IVTFTexture I8, uint8_t, 16-byte aligned
-     * @param src - source buffer: AVFrame uint16_t, 32/64-byte aligned
-     * @param bts - Number of bytes to copy
-     * @param sft - Right shift amount (0-15)
-     */
-    VMSM_INLINE void Convert_U16_U8_RRS(
-        uint8_t *VMSM_RESTRICT dst, const uint16_t *VMSM_RESTRICT src, size_t bts, int sft ) const noexcept
-    {
-        m_convert_u16_u8_rrs_fn( dst, src, bts, sft );
-    }
-
     // --------------------------------------------------------------------------------------------
     // CPU feature queries
     // --------------------------------------------------------------------------------------------
@@ -84,11 +71,9 @@ struct VideoMaterialSIMD final {
 
     // Function pointer types
     using MemcpyFn = void( * )( uint8_t *VMSM_RESTRICT, uint8_t *VMSM_RESTRICT, size_t );
-    using ConvertShiftFn = void( * )( uint8_t *VMSM_RESTRICT, const uint16_t *VMSM_RESTRICT, size_t, int );
 
     // Function pointers (jump table)
     MemcpyFn m_memcpy_fn = nullptr;
-    ConvertShiftFn m_convert_u16_u8_rrs_fn = nullptr;
 
     // --------------------------------------------------------------------------------------------
     // Memcpy implementations
@@ -98,13 +83,4 @@ struct VideoMaterialSIMD final {
     static VMSM_INLINE void memcpy_avx2( uint8_t *VMSM_RESTRICT dst, uint8_t *VMSM_RESTRICT src, size_t bts ) noexcept;
     // SSE2
     static VMSM_INLINE void memcpy_sse2( uint8_t *VMSM_RESTRICT dst, uint8_t *VMSM_RESTRICT src, size_t bts ) noexcept;
-
-    // --------------------------------------------------------------------------------------------
-    // Convert_U16_U8_RRS implementations
-    // --------------------------------------------------------------------------------------------
-
-    // AVX2
-    static VMSM_INLINE void convert_u16_u8_rrs_avx2( uint8_t *VMSM_RESTRICT dst, const uint16_t *VMSM_RESTRICT src, size_t bts, int sft ) noexcept;
-    // SSE2
-    static VMSM_INLINE void convert_u16_u8_rrs_sse2( uint8_t *VMSM_RESTRICT dst, const uint16_t *VMSM_RESTRICT src, size_t bts, int sft ) noexcept;
 };
diff --git a/src/lib/public/shaderlib.lib b/src/lib/public/shaderlib.lib

Original file line number	Diff line number	Diff line change
`@@ -441,10 +441,10 @@ void VideoFFmpegPlayer::PrintInfo( std::string &filePath ) noexcept {`
`441`	`441`
`442`	`442`	`ConColorMsg( Color( 77, 166, 255, 150 ), " Decoder:\n" );`
`443`	`443`	`if ( decoder != nullptr ) {`
`444`		`- ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:        %s (%s)\n", decoder->name ? decoder->name : "unknown", decoder->long_name ? decoder->long_name : "unknown" );`
	`444`	`+ ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:         %s (%s)\n", decoder->name ? decoder->name : "unknown", decoder->long_name ? decoder->long_name : "unknown" );`
`445`	`445`	`}`
`446`	`446`	`else {`
`447`		`- ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:        unknown\n" );`
	`447`	`+ ConColorMsg( Color( 153, 204, 255, 255 ), "    Decoder:         unknown\n" );`
`448`	`448`	`}`
`449`	`449`	`ConColorMsg( Color( 153, 204, 255, 150 ), " Pixel Format: %s\n", pixFmt ? pixFmt : "unknown" );`
`450`	`450`	`ConColorMsg( Color( 153, 204, 255, 255 ), " Color range: %s\n", range_str ? range_str : "unknown" );`