From 5a079a2d114f96d4847d1ee305d5b7c16eeec50e Mon Sep 17 00:00:00 2001 From: 3gg <3gg@shellblade.net> Date: Sat, 27 Dec 2025 12:03:39 -0800 Subject: Initial commit --- contrib/SDL-3.2.8/src/video/SDL_blit_copy.c | 110 ++++++++++++++++++++++++++++ 1 file changed, 110 insertions(+) create mode 100644 contrib/SDL-3.2.8/src/video/SDL_blit_copy.c (limited to 'contrib/SDL-3.2.8/src/video/SDL_blit_copy.c') diff --git a/contrib/SDL-3.2.8/src/video/SDL_blit_copy.c b/contrib/SDL-3.2.8/src/video/SDL_blit_copy.c new file mode 100644 index 0000000..05ce0a4 --- /dev/null +++ b/contrib/SDL-3.2.8/src/video/SDL_blit_copy.c @@ -0,0 +1,110 @@ +/* + Simple DirectMedia Layer + Copyright (C) 1997-2025 Sam Lantinga + + This software is provided 'as-is', without any express or implied + warranty. In no event will the authors be held liable for any damages + arising from the use of this software. + + Permission is granted to anyone to use this software for any purpose, + including commercial applications, and to alter it and redistribute it + freely, subject to the following restrictions: + + 1. The origin of this software must not be misrepresented; you must not + claim that you wrote the original software. If you use this software + in a product, an acknowledgment in the product documentation would be + appreciated but is not required. + 2. Altered source versions must be plainly marked as such, and must not be + misrepresented as being the original software. + 3. This notice may not be removed or altered from any source distribution. +*/ +#include "SDL_internal.h" + +#include "SDL_surface_c.h" +#include "SDL_blit_copy.h" + +#ifdef SDL_SSE_INTRINSICS +// This assumes 16-byte aligned src and dst +static SDL_INLINE void SDL_TARGETING("sse") SDL_memcpySSE(Uint8 *dst, const Uint8 *src, int len) +{ + int i; + + __m128 values[4]; + for (i = len / 64; i--;) { + _mm_prefetch((const char *)src, _MM_HINT_NTA); + values[0] = *(__m128 *)(src + 0); + values[1] = *(__m128 *)(src + 16); + values[2] = *(__m128 *)(src + 32); + values[3] = *(__m128 *)(src + 48); + _mm_stream_ps((float *)(dst + 0), values[0]); + _mm_stream_ps((float *)(dst + 16), values[1]); + _mm_stream_ps((float *)(dst + 32), values[2]); + _mm_stream_ps((float *)(dst + 48), values[3]); + src += 64; + dst += 64; + } + + if (len & 63) { + SDL_memcpy(dst, src, len & 63); + } +} +#endif // SDL_SSE_INTRINSICS + +void SDL_BlitCopy(SDL_BlitInfo *info) +{ + bool overlap; + Uint8 *src, *dst; + int w, h; + int srcskip, dstskip; + + w = info->dst_w * info->dst_fmt->bytes_per_pixel; + h = info->dst_h; + src = info->src; + dst = info->dst; + srcskip = info->src_pitch; + dstskip = info->dst_pitch; + + // Properly handle overlapping blits + if (src < dst) { + overlap = (dst < (src + h * srcskip)); + } else { + overlap = (src < (dst + h * dstskip)); + } + if (overlap) { + if (dst < src) { + while (h--) { + SDL_memmove(dst, src, w); + src += srcskip; + dst += dstskip; + } + } else { + src += ((h - 1) * srcskip); + dst += ((h - 1) * dstskip); + while (h--) { + SDL_memmove(dst, src, w); + src -= srcskip; + dst -= dstskip; + } + } + return; + } + +#ifdef SDL_SSE_INTRINSICS + if (SDL_HasSSE() && + !((uintptr_t)src & 15) && !(srcskip & 15) && + !((uintptr_t)dst & 15) && !(dstskip & 15)) { + while (h--) { + SDL_memcpySSE(dst, src, w); + src += srcskip; + dst += dstskip; + } + return; + } +#endif + + while (h--) { + SDL_memcpy(dst, src, w); + src += srcskip; + dst += dstskip; + } +} -- cgit v1.2.3