libretro
diff --git a/.github/workflows/Linux-libretro-common-samples.yml b/.github/workflows/Linux-libretro-common-samples.yml
Lines changed: 2 additions & 0 deletions
diff --git a/libretro-common/formats/bmp/rbmp.c b/libretro-common/formats/bmp/rbmp.c
Lines changed: 43 additions & 6 deletions
diff --git a/libretro-common/formats/tga/rtga.c b/libretro-common/formats/tga/rtga.c
Lines changed: 68 additions & 9 deletions
diff --git a/libretro-common/samples/formats/bmp/Makefile b/libretro-common/samples/formats/bmp/Makefile
Lines changed: 24 additions & 0 deletions
@@ -56,6 +56,8 @@ jobs:
             cdrom_cuesheet_overflow_test
             http_parse_test
             rjson_test
+            rtga_test
+            rbmp_test
           )
 
           # Per-binary run command (overrides ./<binary> if present).
 
@@ -28,6 +28,7 @@
 #include <stddef.h> /* ptrdiff_t on osx */
 #include <stdlib.h>
 #include <string.h>
+#include <limits.h> /* INT_MAX */
 
 #include <retro_inline.h>
 
@@ -66,13 +67,20 @@ static INLINE unsigned char rbmp_get8(rbmp_context *s)
 
 static void rbmp_skip(rbmp_context *s, int n)
 {
+   ptrdiff_t remaining;
    if (n < 0)
    {
       s->img_buffer = s->img_buffer_end;
       return;
    }
-
-   s->img_buffer += n;
+   /* Clamp to remaining input to avoid pointer arithmetic beyond
+    * img_buffer_end (UB per C99).  Subsequent rbmp_get8 calls
+    * check "buffer < buffer_end" and parse as EOF. */
+   remaining = s->img_buffer_end - s->img_buffer;
+   if ((ptrdiff_t)n > remaining)
+      s->img_buffer = s->img_buffer_end;
+   else
+      s->img_buffer += n;
 }
 
 static int rbmp_get16le(rbmp_context *s)
@@ -193,8 +201,16 @@ static uint32_t *rbmp_bmp_load(rbmp_context *s, unsigned *x, unsigned *y,
    if (bpp == 1)
       return 0;
 
+   /* img_y can legitimately be a negative int (top-down BMP).
+    * Pre-patch the code called abs((int)s->img_y) unguarded -- if
+    * the uint32 happened to be 0x80000000, the cast to int is
+    * INT_MIN and abs(INT_MIN) is undefined behaviour.  Detect
+    * that case and reject the image outright, before abs() is
+    * reached. */
+   if (s->img_y == 0x80000000u)
+      return 0;
    flip_vertically = ((int) s->img_y) > 0;
-   s->img_y        = abs((int) s->img_y);
+   s->img_y        = (uint32_t)abs((int) s->img_y);
 
    if (hsz == 12)
    {
@@ -298,8 +314,25 @@ static uint32_t *rbmp_bmp_load(rbmp_context *s, unsigned *x, unsigned *y,
    }
    s->img_n = ma ? 4 : 3;
 
-   /* Always output as uint32 (4 bytes per pixel) */
-   output = (uint32_t*)malloc(s->img_x * s->img_y * sizeof(uint32_t));
+   /* Always output as uint32 (4 bytes per pixel).
+    *
+    * Pre-patch this multiplied two uint32_t dimensions at uint32_t
+    * width, so img_x * img_y silently wrapped modulo 2^32 -- e.g.
+    * 0x10001 * 0x10000 = 0x100010000 wraps to 0x10000, and the
+    * subsequent malloc returned a 256 KiB buffer that the pixel
+    * decode loop wrote off the end of (4 GiB+ of writes).  Do
+    * the multiplication in size_t with an explicit ceiling:
+    * 0x4000 x 0x4000 = 256 M pixels = 1 GiB of decoded RGBA is
+    * far beyond any realistic libretro asset, and rejecting at
+    * that ceiling blocks the overflow case AND avoids giving a
+    * malicious BMP a direct route to a multi-GiB allocation
+    * attempt. */
+   if (s->img_x == 0 || s->img_y == 0)
+      return 0;
+   if (s->img_x > 0x4000u || s->img_y > 0x4000u)
+      return 0;
+   output = (uint32_t*)malloc(
+         (size_t)s->img_x * (size_t)s->img_y * sizeof(uint32_t));
    if (!output)
       return 0;
 
@@ -342,7 +375,11 @@ static uint32_t *rbmp_bmp_load(rbmp_context *s, unsigned *x, unsigned *y,
       for (j = 0; j < (int)s->img_y; ++j)
       {
          int dst_row = flip_vertically ? (int)(s->img_y - 1 - j) : j;
-         uint32_t *dst = output + dst_row * s->img_x;
+         /* Use size_t for the row-stride offset.  Both dimensions
+          * are capped at 0x4000 before the allocation, so the
+          * product fits in 32 bits either way; doing it in size_t
+          * keeps the pointer math matching the allocation. */
+         uint32_t *dst = output + (size_t)dst_row * (size_t)s->img_x;
          int col = 0;
 
          for (i = 0; i < (int)s->img_x; i += 2)
 
@@ -28,6 +28,7 @@
 #include <stddef.h> /* ptrdiff_t on osx */
 #include <stdlib.h>
 #include <string.h>
+#include <limits.h> /* INT_MAX */
 
 #include <retro_inline.h>
 
@@ -60,12 +61,24 @@ static INLINE uint8_t rtga_get8(rtga_context *s)
 
 static void rtga_skip(rtga_context *s, int n)
 {
+   ptrdiff_t remaining;
    if (n < 0)
    {
       s->img_buffer = s->img_buffer_end;
       return;
    }
-   s->img_buffer += n;
+   /* Clamp the advance to the remaining input.  Pre-patch a large
+    * attacker-supplied offset (TGA header byte 1, or palette
+    * start) pushed img_buffer past img_buffer_end, which is
+    * pointer arithmetic outside the allocated object (UB per C99).
+    * All callers of rtga_get8 check "buffer < buffer_end" so the
+    * clamped state parses as EOF and the subsequent header checks
+    * or indexed-palette code fail cleanly. */
+   remaining = s->img_buffer_end - s->img_buffer;
+   if ((ptrdiff_t)n > remaining)
+      s->img_buffer = s->img_buffer_end;
+   else
+      s->img_buffer += n;
 }
 
 static int rtga_get16le(rtga_context *s)
@@ -121,17 +134,48 @@ static uint32_t *rtga_tga_load(rtga_context *s,
       )
       return NULL;
 
-   /*   If paletted, then we will use the number of bits from the palette */
+   /*   If paletted, then we will use the number of bits from the palette.
+    *
+    *   tga_palette_bits is attacker-controlled (TGA byte 7, 0..255).
+    *   Pre-patch the indexed-read loop below did
+    *       for (j = 0; j * 8 < tga_palette_bits; ++j)
+    *           raw_data[j] = tga_palette[pal_idx + j];
+    *   raw_data is a 4-byte stack array, so tga_palette_bits > 32
+    *   wrote past the end of raw_data -- a stack buffer overflow of
+    *   up to 28 bytes, directly driven by the TGA header.  Reject
+    *   bogus palette_bits / empty palettes here and everything
+    *   downstream runs with bounded buffers. */
    if (tga_indexed)
+   {
+      if (    tga_palette_len < 1
+           || (    tga_palette_bits != 15
+                && tga_palette_bits != 16
+                && tga_palette_bits != 24
+                && tga_palette_bits != 32))
+         return NULL;
       tga_comp = tga_palette_bits / 8;
+   }
 
    /*   TGA info */
    *x = tga_width;
    *y = tga_height;
    if (comp)
       *comp = tga_comp;
 
-   output = (uint32_t*)malloc((size_t)tga_width * tga_height * sizeof(uint32_t));
+   /* Bound the output allocation.  TGA dimensions are attacker-
+    * controlled 16-bit values (max 65535), so their product is
+    * up to ~4.29 G pixels.  Pre-patch a 32-bit build could wrap
+    * (size_t)w * h * sizeof(uint32_t) to a small positive size_t
+    * and the per-pixel decode ran off the undersized malloc.
+    * Reject dimensions beyond a sane ceiling so the allocation
+    * never grows anywhere near wrap territory and hostile
+    * headers cannot drive the client into a multi-GiB malloc
+    * attempt.  0x4000 x 0x4000 = 1 GiB of decoded RGBA,
+    * comfortably larger than any real-world libretro asset. */
+   if (tga_width > 0x4000 || tga_height > 0x4000)
+      return NULL;
+   output = (uint32_t*)malloc(
+         (size_t)tga_width * (size_t)tga_height * sizeof(uint32_t));
    if (!output)
       return NULL;
 
@@ -226,19 +270,23 @@ static uint32_t *rtga_tga_load(rtga_context *s,
       int cur_col                = 0;
       int cur_row                = 0;
 
-      /* Load palette if indexed */
+      /* Load palette if indexed.  Header-level checks above have
+       * ensured tga_palette_len >= 1 and tga_palette_bits in
+       * {15,16,24,32}, so n is positive and bounded at
+       * 65535 * 32 / 8 = 262140 bytes -- fits comfortably in int.
+       * Whether the input really holds n bytes is checked below. */
       if (tga_indexed)
       {
          int n;
          rtga_skip(s, tga_palette_start);
-         tga_palette = (unsigned char*)malloc(tga_palette_len * tga_palette_bits / 8);
+         n = tga_palette_len * tga_palette_bits / 8;
+         tga_palette = (unsigned char*)malloc((size_t)n);
          if (!tga_palette)
          {
             free(output);
             return NULL;
          }
-         n = tga_palette_len * tga_palette_bits / 8;
-         if (s->img_buffer + n <= s->img_buffer_end)
+         if (s->img_buffer_end - s->img_buffer >= (ptrdiff_t)n)
          {
             memcpy(tga_palette, s->img_buffer, n);
             s->img_buffer += n;
@@ -325,9 +373,11 @@ static uint32_t *rtga_tga_load(rtga_context *s,
                   | ((uint32_t)g << 8)  | (uint32_t)b;
 
          /* Write to correct position using tracked row/col
-          * (avoids per-pixel division and modulo) */
+          * (avoids per-pixel division and modulo).  Use size_t for
+          * the index so it is computed at the same width as the
+          * size_t-based allocation (dimensions are <= 0x4000). */
          dst_row = tga_inverted ? (tga_height - 1 - cur_row) : cur_row;
-         output[dst_row * tga_width + cur_col] = pixel;
+         output[(size_t)dst_row * (size_t)tga_width + (size_t)cur_col] = pixel;
 
          if (++cur_col >= tga_width)
          {
@@ -366,6 +416,15 @@ int rtga_process_image(rtga_t *rtga, void **buf_data,
    if (!rtga)
       return IMAGE_PROCESS_ERROR;
 
+   /* Reject sizes that don't fit in int before casting.  A TGA
+    * file larger than INT_MAX bytes handed to an int-taking API
+    * would be truncated; the truncated (potentially negative)
+    * length then feeds img_buffer_end = buffer + len, producing
+    * pointer arithmetic outside the source object (UB).  A 2 GiB
+    * TGA is unreasonable; reject early. */
+   if (size > (size_t)INT_MAX)
+      return IMAGE_PROCESS_ERROR;
+
    rtga->output_image   = rtga_load_from_memory(rtga->buff_data,
                            (int)size, width, height, &comp, supports_rgba);
    *buf_data             = rtga->output_image;
 
@@ -0,0 +1,24 @@
+TARGET := rbmp_test
+
+LIBRETRO_COMM_DIR := ../../..
+
+SOURCES := \
+	rbmp_test.c \
+	$(LIBRETRO_COMM_DIR)/formats/bmp/rbmp.c
+
+OBJS := $(SOURCES:.c=.o)
+
+CFLAGS += -Wall -pedantic -std=gnu99 -g -I$(LIBRETRO_COMM_DIR)/include
+
+all: $(TARGET)
+
+%.o: %.c
+	$(CC) -c -o $@ $< $(CFLAGS)
+
+$(TARGET): $(OBJS)
+	$(CC) -o $@ $^ $(LDFLAGS)
+
+clean:
+	rm -f $(TARGET) $(OBJS)
+
+.PHONY: clean
Original file line number	Diff line number	Diff line change
`@@ -56,6 +56,8 @@ jobs:`
`56`	`56`	`cdrom_cuesheet_overflow_test`
`57`	`57`	`http_parse_test`
`58`	`58`	`rjson_test`
	`59`	`+ rtga_test`
	`60`	`+ rbmp_test`
`59`	`61`	`)`
`60`	`62`
`61`	`63`	`# Per-binary run command (overrides ./<binary> if present).`