| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437 |
- /*
- Simple DirectMedia Layer
- Copyright (C) 1997-2026 Sam Lantinga <slouken@libsdl.org>
- This software is provided 'as-is', without any express or implied
- warranty. In no event will the authors be held liable for any damages
- arising from the use of this software.
- Permission is granted to anyone to use this software for any purpose,
- including commercial applications, and to alter it and redistribute it
- freely, subject to the following restrictions:
- 1. The origin of this software must not be misrepresented; you must not
- claim that you wrote the original software. If you use this software
- in a product, an acknowledgment in the product documentation would be
- appreciated but is not required.
- 2. Altered source versions must be plainly marked as such, and must not be
- misrepresented as being the original software.
- 3. This notice may not be removed or altered from any source distribution.
- */
- #include "SDL_internal.h"
- #include "SDL_surface_c.h"
- #ifdef SDL_SSE_INTRINSICS
- /* *INDENT-OFF* */ // clang-format off
- #if defined(_MSC_VER) && !defined(__clang__)
- #define SSE_BEGIN \
- __m128 c128; \
- c128.m128_u32[0] = color; \
- c128.m128_u32[1] = color; \
- c128.m128_u32[2] = color; \
- c128.m128_u32[3] = color
- #else
- #define SSE_BEGIN \
- __m128 c128; \
- DECLARE_ALIGNED(Uint32, cccc[4], 16); \
- cccc[0] = color; \
- cccc[1] = color; \
- cccc[2] = color; \
- cccc[3] = color; \
- c128 = *(__m128 *)cccc
- #endif
- #define SSE_WORK \
- for (i = n / 64; i--;) { \
- _mm_stream_ps((float *)(p+0), c128); \
- _mm_stream_ps((float *)(p+16), c128); \
- _mm_stream_ps((float *)(p+32), c128); \
- _mm_stream_ps((float *)(p+48), c128); \
- p += 64; \
- }
- #define SSE_END
- #define DEFINE_SSE_FILLRECT(bpp, type) \
- static void SDL_TARGETING("sse") SDL_FillSurfaceRect##bpp##SSE(Uint8 *pixels, int pitch, Uint32 color, int w, int h) \
- { \
- int i, n; \
- Uint8 *p = NULL; \
- \
- /* If the number of bytes per row is equal to the pitch, treat */ \
- /* all rows as one long continuous row (for better performance) */ \
- if ((w) * (bpp) == pitch) { \
- w = w * h; \
- h = 1; \
- } \
- \
- SSE_BEGIN; \
- \
- while (h--) { \
- n = (w) * (bpp); \
- p = pixels; \
- \
- if (n > 63) { \
- int adjust = 16 - ((uintptr_t)p & 15); \
- if (adjust < 16) { \
- n -= adjust; \
- adjust /= (bpp); \
- while (adjust--) { \
- *((type *)p) = (type)color; \
- p += (bpp); \
- } \
- } \
- SSE_WORK; \
- } \
- if (n & 63) { \
- int remainder = (n & 63); \
- remainder /= (bpp); \
- while (remainder--) { \
- *((type *)p) = (type)color; \
- p += (bpp); \
- } \
- } \
- pixels += pitch; \
- } \
- \
- SSE_END; \
- }
- static void SDL_TARGETING("sse") SDL_FillSurfaceRect1SSE(Uint8 *pixels, int pitch, Uint32 color, int w, int h)
- {
- int i, n;
- SSE_BEGIN;
- while (h--) {
- Uint8 *p = pixels;
- n = w;
- if (n > 63) {
- int adjust = 16 - ((uintptr_t)p & 15);
- if (adjust) {
- n -= adjust;
- SDL_memset(p, color, adjust);
- p += adjust;
- }
- SSE_WORK;
- }
- if (n & 63) {
- int remainder = (n & 63);
- SDL_memset(p, color, remainder);
- }
- pixels += pitch;
- }
- SSE_END;
- }
- // DEFINE_SSE_FILLRECT(1, Uint8)
- DEFINE_SSE_FILLRECT(2, Uint16)
- DEFINE_SSE_FILLRECT(4, Uint32)
- /* *INDENT-ON* */ // clang-format on
- #endif // __SSE__
- #ifdef SDL_LSX_INTRINSICS
- /* *INDENT-OFF* */ // clang-format off
- #define LSX_BEGIN __m128i c128 = __lsx_vreplgr2vr_w(color);
- #define LSX_WORK \
- for (i = n / 64; i--;) { \
- __lsx_vst(c128, p, 0); \
- __lsx_vst(c128, p, 16); \
- __lsx_vst(c128, p, 32); \
- __lsx_vst(c128, p, 48); \
- p += 64; \
- }
- #define DEFINE_LSX_FILLRECT(bpp, type) \
- static void SDL_TARGETING("lsx") SDL_FillSurfaceRect##bpp##LSX(Uint8 *pixels, int pitch, Uint32 color, int w, int h) \
- { \
- int i, n; \
- Uint8 *p = NULL; \
- \
- /* If the number of bytes per row is equal to the pitch, treat */ \
- /* all rows as one long continuous row (for better performance) */ \
- if ((w) * (bpp) == pitch) { \
- w = w * h; \
- h = 1; \
- } \
- \
- LSX_BEGIN; \
- \
- while (h--) { \
- n = (w) * (bpp); \
- p = pixels; \
- \
- if (n > 63) { \
- int adjust = 16 - ((uintptr_t)p & 15); \
- if (adjust < 16) { \
- n -= adjust; \
- adjust /= (bpp); \
- while (adjust--) { \
- *((type *)p) = (type)color; \
- p += (bpp); \
- } \
- } \
- LSX_WORK; \
- } \
- if (n & 63) { \
- int remainder = (n & 63); \
- remainder /= (bpp); \
- while (remainder--) { \
- *((type *)p) = (type)color; \
- p += (bpp); \
- } \
- } \
- pixels += pitch; \
- } \
- \
- }
- DEFINE_LSX_FILLRECT(4, Uint32)
- /* *INDENT-ON* */ // clang-format on
- #endif /* __LSX__ */
- static void SDL_FillSurfaceRect1(Uint8 *pixels, int pitch, Uint32 color, int w, int h)
- {
- int n;
- Uint8 *p = NULL;
- while (h--) {
- n = w;
- p = pixels;
- if (n > 3) {
- switch ((uintptr_t)p & 3) {
- case 1:
- *p++ = (Uint8)color;
- --n;
- SDL_FALLTHROUGH;
- case 2:
- *p++ = (Uint8)color;
- --n;
- SDL_FALLTHROUGH;
- case 3:
- *p++ = (Uint8)color;
- --n;
- }
- SDL_memset4(p, color, (n >> 2));
- }
- if (n & 3) {
- p += (n & ~3);
- switch (n & 3) {
- case 3:
- *p++ = (Uint8)color;
- SDL_FALLTHROUGH;
- case 2:
- *p++ = (Uint8)color;
- SDL_FALLTHROUGH;
- case 1:
- *p++ = (Uint8)color;
- }
- }
- pixels += pitch;
- }
- }
- static void SDL_FillSurfaceRect2(Uint8 *pixels, int pitch, Uint32 color, int w, int h)
- {
- int n;
- Uint16 *p = NULL;
- while (h--) {
- n = w;
- p = (Uint16 *)pixels;
- if (n > 1) {
- if ((uintptr_t)p & 2) {
- *p++ = (Uint16)color;
- --n;
- }
- SDL_memset4(p, color, (n >> 1));
- }
- if (n & 1) {
- p[n - 1] = (Uint16)color;
- }
- pixels += pitch;
- }
- }
- static void SDL_FillSurfaceRect3(Uint8 *pixels, int pitch, Uint32 color, int w, int h)
- {
- #if SDL_BYTEORDER == SDL_LIL_ENDIAN
- Uint8 b1 = (Uint8)(color & 0xFF);
- Uint8 b2 = (Uint8)((color >> 8) & 0xFF);
- Uint8 b3 = (Uint8)((color >> 16) & 0xFF);
- #elif SDL_BYTEORDER == SDL_BIG_ENDIAN
- Uint8 b1 = (Uint8)((color >> 16) & 0xFF);
- Uint8 b2 = (Uint8)((color >> 8) & 0xFF);
- Uint8 b3 = (Uint8)(color & 0xFF);
- #endif
- int n;
- Uint8 *p = NULL;
- while (h--) {
- n = w;
- p = pixels;
- while (n--) {
- *p++ = b1;
- *p++ = b2;
- *p++ = b3;
- }
- pixels += pitch;
- }
- }
- static void SDL_FillSurfaceRect4(Uint8 *pixels, int pitch, Uint32 color, int w, int h)
- {
- while (h--) {
- SDL_memset4(pixels, color, w);
- pixels += pitch;
- }
- }
- /*
- * This function performs a fast fill of the given rectangle with 'color'
- */
- bool SDL_FillSurfaceRect(SDL_Surface *dst, const SDL_Rect *rect, Uint32 color)
- {
- CHECK_PARAM(!SDL_SurfaceValid(dst)) {
- return SDL_InvalidParamError("SDL_FillSurfaceRect(): dst");
- }
- // If 'rect' == NULL, then fill the whole surface
- if (!rect) {
- rect = &dst->clip_rect;
- // Don't attempt to fill if the surface's clip_rect is empty
- if (SDL_RectEmpty(rect)) {
- return true;
- }
- }
- return SDL_FillSurfaceRects(dst, rect, 1, color);
- }
- bool SDL_FillSurfaceRects(SDL_Surface *dst, const SDL_Rect *rects, int count, Uint32 color)
- {
- SDL_Rect clipped;
- Uint8 *pixels;
- const SDL_Rect *rect;
- void (*fill_function)(Uint8 * pixels, int pitch, Uint32 color, int w, int h) = NULL;
- int i;
- CHECK_PARAM(!SDL_SurfaceValid(dst)) {
- return SDL_InvalidParamError("SDL_FillSurfaceRects(): dst");
- }
- CHECK_PARAM(!rects) {
- return SDL_InvalidParamError("SDL_FillSurfaceRects(): rects");
- }
- if (!dst->pixels && SDL_MUSTLOCK(dst)) {
- return SDL_SetError("SDL_FillSurfaceRects(): You must lock the surface");
- }
- // Nothing to do
- if (dst->w == 0 || dst->h == 0 || !dst->pixels) {
- return true;
- }
- /* This function doesn't usually work on surfaces < 8 bpp
- * Except: support for 4bits, when filling full size.
- */
- if (SDL_BITSPERPIXEL(dst->format) < 8) {
- if (count == 1) {
- const SDL_Rect *r = &rects[0];
- if (r->x == 0 && r->y == 0 && r->w == dst->w && r->h == dst->h) {
- if (SDL_BITSPERPIXEL(dst->format) == 4) {
- Uint8 b = (((Uint8)color << 4) | (Uint8)color);
- SDL_memset(dst->pixels, b, (size_t)dst->h * dst->pitch);
- return true;
- }
- }
- }
- return SDL_SetError("SDL_FillSurfaceRects(): Unsupported surface format");
- }
- if (fill_function == NULL) {
- switch (SDL_BYTESPERPIXEL(dst->format)) {
- case 1:
- {
- color |= (color << 8);
- color |= (color << 16);
- #ifdef SDL_SSE_INTRINSICS
- if (SDL_HasSSE()) {
- fill_function = SDL_FillSurfaceRect1SSE;
- break;
- }
- #endif
- fill_function = SDL_FillSurfaceRect1;
- break;
- }
- case 2:
- {
- color |= (color << 16);
- #ifdef SDL_SSE_INTRINSICS
- if (SDL_HasSSE()) {
- fill_function = SDL_FillSurfaceRect2SSE;
- break;
- }
- #endif
- fill_function = SDL_FillSurfaceRect2;
- break;
- }
- case 3:
- // 24-bit RGB is a slow path, at least for now.
- {
- fill_function = SDL_FillSurfaceRect3;
- break;
- }
- case 4:
- {
- #ifdef SDL_SSE_INTRINSICS
- if (SDL_HasSSE()) {
- fill_function = SDL_FillSurfaceRect4SSE;
- break;
- }
- #endif
- #ifdef SDL_LSX_INTRINSICS
- if (SDL_HasLSX()) {
- fill_function = SDL_FillSurfaceRect4LSX;
- break;
- }
- #endif
- fill_function = SDL_FillSurfaceRect4;
- break;
- }
- default:
- return SDL_SetError("Unsupported pixel format");
- }
- }
- for (i = 0; i < count; ++i) {
- rect = &rects[i];
- // Perform clipping
- if (!SDL_GetRectIntersection(rect, &dst->clip_rect, &clipped)) {
- continue;
- }
- rect = &clipped;
- pixels = (Uint8 *)dst->pixels + rect->y * dst->pitch +
- rect->x * SDL_BYTESPERPIXEL(dst->format);
- fill_function(pixels, dst->pitch, color, rect->w, rect->h);
- }
- // We're done!
- return true;
- }
|