mirror of
https://github.com/dolphin-emu/dolphin.git
synced 2024-11-14 21:37:52 -07:00
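The declaration of o1..o4 needs to be in the right place (before the `#if _M_SSE >= 0x401` block rather than inside it) to work for builds targeting less than SSE4. Going to bed now :P.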
git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@6776 8ced0084-cf51-0410-be5f-012b33b47a6e
This commit is contained in:
parent
87bd4dd4b9
commit
62b79028ef
@ -1031,9 +1031,9 @@ PC_TexFormat TexDecoder_Decode_RGBA(u32 * dst, const u8 * src, int width, int he
|
|||||||
// (bbbbbbbb bbbbbbbb aaaaaaaa aaaaaaaa) -> (bbbbbbbb 00000000 aaaaaaaa 00000000)
|
// (bbbbbbbb bbbbbbbb aaaaaaaa aaaaaaaa) -> (bbbbbbbb 00000000 aaaaaaaa 00000000)
|
||||||
// And last but not least, _mm_or_si128 ORs those two together, giving us the interleaving we desire:
|
// And last but not least, _mm_or_si128 ORs those two together, giving us the interleaving we desire:
|
||||||
// (00000000 BBBBBBBB 00000000 AAAAAAAA) | (bbbbbbbb 00000000 aaaaaaaa 00000000) -> (bbbbbbbb BBBBBBBB aaaaaaaa AAAAAAAA)
|
// (00000000 BBBBBBBB 00000000 AAAAAAAA) | (bbbbbbbb 00000000 aaaaaaaa 00000000) -> (bbbbbbbb BBBBBBBB aaaaaaaa AAAAAAAA)
|
||||||
|
__m128i o1, o2, o3, o4;
|
||||||
#if _M_SSE >= 0x401
|
#if _M_SSE >= 0x401
|
||||||
// SSE4 gives 5-10% improvement in I4 texture decode when this runs:
|
// SSE4 gives 5-10% improvement in I4 texture decode when this runs:
|
||||||
__m128i o1, o2, o3, o4;
|
|
||||||
if (cpu_info.bSSE4_1) {
|
if (cpu_info.bSSE4_1) {
|
||||||
o1 = _mm_blend_epi16(i251, i151, 0x33); // 0x33 = 00110011
|
o1 = _mm_blend_epi16(i251, i151, 0x33); // 0x33 = 00110011
|
||||||
o2 = _mm_blend_epi16(i252, i152, 0x33);
|
o2 = _mm_blend_epi16(i252, i152, 0x33);
|
||||||
|
Loading…
Reference in New Issue
Block a user