changeset 3405:d5f2dd33f4eb

Merged improvements to SDL_SoftStretch() from SDL 1.2
author Sam Lantinga <slouken@libsdl.org>
date Sun, 18 Oct 2009 17:49:40 +0000
parents c9dcc73f6a36
children 8ae607392409
files configure.in include/SDL_config.h.in src/video/SDL_stretch.c
diffstat 3 files changed, 87 insertions(+), 51 deletions(-) [+]
line wrap: on
line diff
--- a/configure.in	Sun Oct 18 16:14:35 2009 +0000
+++ b/configure.in	Sun Oct 18 17:49:40 2009 +0000
@@ -204,6 +204,15 @@
     if test x$ac_cv_func_strtod = xyes; then
         AC_DEFINE(HAVE_STRTOD)
     fi
+    AC_CHECK_FUNC(mprotect,
+        AC_TRY_COMPILE([
+          #include <sys/types.h>
+          #include <sys/mman.h>
+        ],[
+        ],[
+        AC_DEFINE(HAVE_MPROTECT)
+        ]),
+    )
     AC_CHECK_FUNCS(malloc calloc realloc free getenv putenv unsetenv qsort abs bcopy memset memcpy memmove strlen strlcpy strlcat strdup _strrev _strupr _strlwr strchr strrchr strstr itoa _ltoa _uitoa _ultoa strtol strtoul _i64toa _ui64toa strtoll strtoull atoi atof strcmp strncmp _stricmp strcasecmp _strnicmp strncasecmp sscanf snprintf vsnprintf sigaction setjmp nanosleep)
 
     AC_CHECK_LIB(m, pow, [LIBS="$LIBS -lm"; EXTRA_LDFLAGS="$EXTRA_LDFLAGS -lm"])
--- a/include/SDL_config.h.in	Sun Oct 18 16:14:35 2009 +0000
+++ b/include/SDL_config.h.in	Sun Oct 18 17:49:40 2009 +0000
@@ -151,6 +151,7 @@
 #undef HAVE_NANOSLEEP
 #undef HAVE_CLOCK_GETTIME
 #undef HAVE_GETPAGESIZE
+#undef HAVE_MPROTECT
 
 #else
 /* We may need some replacement for stdarg.h here */
--- a/src/video/SDL_stretch.c	Sun Oct 18 16:14:35 2009 +0000
+++ b/src/video/SDL_stretch.c	Sun Oct 18 17:49:40 2009 +0000
@@ -42,6 +42,16 @@
 
 #ifdef USE_ASM_STRETCH
 
+#ifdef HAVE_MPROTECT
+#include <sys/types.h>
+#include <sys/mman.h>
+#endif
+#ifdef __GNUC__
+#define PAGE_ALIGNED __attribute__((__aligned__(4096)))
+#else
+#define PAGE_ALIGNED
+#endif
+
 #if defined(_M_IX86) || defined(i386)
 #define PREFIX16	0x66
 #define STORE_BYTE	0xAA
@@ -53,7 +63,7 @@
 #error Need assembly opcodes for this architecture
 #endif
 
-static unsigned char copy_row[4096];
+static unsigned char copy_row[4096] PAGE_ALIGNED;
 
 static int
 generate_rowbytes(int src_w, int dst_w, int bpp)
@@ -63,6 +73,7 @@
         int bpp;
         int src_w;
         int dst_w;
+        int status;
     } last;
 
     int i;
@@ -72,11 +83,12 @@
 
     /* See if we need to regenerate the copy buffer */
     if ((src_w == last.src_w) && (dst_w == last.dst_w) && (bpp == last.bpp)) {
-        return (0);
+        return (last.status);
     }
     last.bpp = bpp;
     last.src_w = src_w;
     last.dst_w = dst_w;
+    last.status = -1;
 
     switch (bpp) {
     case 1:
@@ -92,6 +104,13 @@
         SDL_SetError("ASM stretch of %d bytes isn't supported\n", bpp);
         return (-1);
     }
+#ifdef HAVE_MPROTECT
+    /* Make the code writeable */
+    if (mprotect(copy_row, sizeof(copy_row), PROT_READ | PROT_WRITE) < 0) {
+        SDL_SetError("Couldn't make copy buffer writeable");
+        return (-1);
+    }
+#endif
     pos = 0x10000;
     inc = (src_w << 16) / dst_w;
     eip = copy_row;
@@ -111,47 +130,55 @@
     }
     *eip++ = RETURN;
 
-    /* Verify that we didn't overflow (too late) */
+    /* Verify that we didn't overflow (too late!!!) */
     if (eip > (copy_row + sizeof(copy_row))) {
         SDL_SetError("Copy buffer overflow");
         return (-1);
     }
+#ifdef HAVE_MPROTECT
+    /* Make the code executable but not writeable */
+    if (mprotect(copy_row, sizeof(copy_row), PROT_READ | PROT_EXEC) < 0) {
+        SDL_SetError("Couldn't make copy buffer executable");
+        return (-1);
+    }
+#endif
+    last.status = 0;
     return (0);
 }
 
-#else
+#endif /* USE_ASM_STRETCH */
 
-#define DEFINE_COPY_ROW(name, type)                     \
-void name(type *src, int src_w, type *dst, int dst_w)   \
-{                                                       \
-    int i;                                              \
-    int pos, inc;                                       \
-    type pixel = 0;                                     \
-                                                        \
-    pos = 0x10000;                                      \
-    inc = (src_w << 16) / dst_w;                        \
-    for ( i=dst_w; i>0; --i ) {                         \
-        while ( pos >= 0x10000L ) {                     \
-            pixel = *src++;                             \
-            pos -= 0x10000L;                            \
-        }                                               \
-        *dst++ = pixel;                                 \
-        pos += inc;                                     \
-    }                                                   \
+#define DEFINE_COPY_ROW(name, type)			\
+void name(type *src, int src_w, type *dst, int dst_w)	\
+{							\
+	int i;						\
+	int pos, inc;					\
+	type pixel = 0;					\
+							\
+	pos = 0x10000;					\
+	inc = (src_w << 16) / dst_w;			\
+	for ( i=dst_w; i>0; --i ) {			\
+		while ( pos >= 0x10000L ) {		\
+			pixel = *src++;			\
+			pos -= 0x10000L;		\
+		}					\
+		*dst++ = pixel;				\
+		pos += inc;				\
+	}						\
 }
 /* *INDENT-OFF* */
 DEFINE_COPY_ROW(copy_row1, Uint8)
 DEFINE_COPY_ROW(copy_row2, Uint16)
 DEFINE_COPY_ROW(copy_row4, Uint32)
 /* *INDENT-ON* */
-#endif /* USE_ASM_STRETCH */
+
 /* The ASM code doesn't handle 24-bpp stretch blits */
 void
 copy_row3(Uint8 * src, int src_w, Uint8 * dst, int dst_w)
 {
     int i;
     int pos, inc;
-    Uint8 pixel[3];
+    Uint8 pixel[3] = { 0, 0, 0 };
 
     pos = 0x10000;
     inc = (src_w << 16) / dst_w;
@@ -186,9 +213,12 @@
     Uint8 *dstp;
     SDL_Rect full_src;
     SDL_Rect full_dst;
-#if defined(USE_ASM_STRETCH) && defined(__GNUC__)
+#ifdef USE_ASM_STRETCH
+    SDL_bool use_asm = SDL_TRUE;
+#ifdef __GNUC__
     int u1, u2;
 #endif
+#endif /* USE_ASM_STRETCH */
     const int bpp = dst->format->BytesPerPixel;
 
     if (src->format->BitsPerPixel != dst->format->BitsPerPixel) {
@@ -257,8 +287,8 @@
 
 #ifdef USE_ASM_STRETCH
     /* Write the opcodes for this stretch */
-    if ((bpp != 3) && (generate_rowbytes(srcrect->w, dstrect->w, bpp) < 0)) {
-        return (-1);
+    if ((bpp == 3) || (generate_rowbytes(srcrect->w, dstrect->w, bpp) < 0)) {
+        use_asm = SDL_FALSE;
     }
 #endif
 
@@ -273,13 +303,11 @@
             pos -= 0x10000L;
         }
 #ifdef USE_ASM_STRETCH
-        switch (bpp) {
-        case 3:
-            copy_row3(srcp, srcrect->w, dstp, dstrect->w);
-            break;
-        default:
+        if (use_asm) {
 #ifdef __GNUC__
-          __asm__ __volatile__("call *%4": "=&D"(u1), "=&S"(u2): "0"(dstp), "1"(srcp), "r"(copy_row):"memory");
+            __asm__ __volatile__("call *%4":"=&D"(u1), "=&S"(u2)
+                                 :"0"(dstp), "1"(srcp), "r"(copy_row)
+                                 :"memory");
 #elif defined(_MSC_VER) || defined(__WATCOMC__)
             /* *INDENT-OFF* */
             {
@@ -298,26 +326,24 @@
 #else
 #error Need inline assembly for this compiler
 #endif
-            break;
-        }
-#else
-        switch (bpp) {
-        case 1:
-            copy_row1(srcp, srcrect->w, dstp, dstrect->w);
-            break;
-        case 2:
-            copy_row2((Uint16 *) srcp, srcrect->w,
-                      (Uint16 *) dstp, dstrect->w);
-            break;
-        case 3:
-            copy_row3(srcp, srcrect->w, dstp, dstrect->w);
-            break;
-        case 4:
-            copy_row4((Uint32 *) srcp, srcrect->w,
-                      (Uint32 *) dstp, dstrect->w);
-            break;
-        }
+        } else
 #endif
+            switch (bpp) {
+            case 1:
+                copy_row1(srcp, srcrect->w, dstp, dstrect->w);
+                break;
+            case 2:
+                copy_row2((Uint16 *) srcp, srcrect->w,
+                          (Uint16 *) dstp, dstrect->w);
+                break;
+            case 3:
+                copy_row3(srcp, srcrect->w, dstp, dstrect->w);
+                break;
+            case 4:
+                copy_row4((Uint32 *) srcp, srcrect->w,
+                          (Uint32 *) dstp, dstrect->w);
+                break;
+            }
         pos += inc;
     }