|
| 1 | +"""Utility for detecting image formats from raw bytes.""" |
| 2 | + |
| 3 | +from resolver_athena_client.generated.athena.models_pb2 import ImageFormat |
| 4 | + |
# Leading-byte signatures ("magic numbers") that detect_image_format compares
# against the start of the input to decide which format it is looking at.
PNG_MAGIC_BYTES = b"\x89PNG"
JPEG_MAGIC_BYTES = b"\xff\xd8\xff"
# GIF has two accepted signatures; both are reported as the same GIF format.
GIF87A_MAGIC_BYTES = b"GIF87a"
GIF89A_MAGIC_BYTES = b"GIF89a"
BMP_MAGIC_BYTES = b"BM"
# WebP is matched in two parts: RIFF at offset 0 and WEBP at offset 8.
WEBP_RIFF_MAGIC_BYTES = b"RIFF"
WEBP_WEBP_MAGIC_BYTES = b"WEBP"
# TIFF has a little-endian (LE) and a big-endian (BE) signature; either matches.
TIFF_LE_MAGIC_BYTES = b"II*\x00"
TIFF_BE_MAGIC_BYTES = b"MM\x00*"
| 14 | + |
| 15 | + |
def detect_image_format(data: bytes) -> ImageFormat.ValueType:
    """Identify an image's format by inspecting its leading signature bytes.

    Formats recognised purely by a fixed prefix (PNG, JPEG, GIF, BMP, TIFF)
    are looked up in a signature table. WebP is handled separately because
    its signature is split in two: ``RIFF`` at offset 0 and ``WEBP`` at
    offset 8, with the four bytes in between skipped.

    Args:
    ----
        data: Raw image bytes to analyze

    Returns:
    -------
        ImageFormat enum value for the first matching signature, or
        IMAGE_FORMAT_UNSPECIFIED when ``data`` is empty or matches none

    """
    unknown = ImageFormat.IMAGE_FORMAT_UNSPECIFIED
    if not data:
        return unknown

    # (signature, format) pairs for formats identified by a plain prefix.
    # The prefixes start with different bytes, so at most one can match.
    prefix_signatures = (
        (PNG_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_PNG),
        (JPEG_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_JPEG),
        (GIF87A_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_GIF),
        (GIF89A_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_GIF),
        (BMP_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_BMP),
        (TIFF_LE_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_TIFF),
        (TIFF_BE_MAGIC_BYTES, ImageFormat.IMAGE_FORMAT_TIFF),
    )
    for signature, image_format in prefix_signatures:
        # A slice of input shorter than the signature can never compare equal,
        # so no separate length check is needed.
        if data[: len(signature)] == signature:
            return image_format

    # WebP: "RIFF", four skipped bytes, then "WEBP" (12 bytes in total).
    riff_end = len(WEBP_RIFF_MAGIC_BYTES)
    fourcc_start = riff_end + 4
    fourcc_end = fourcc_start + len(WEBP_WEBP_MAGIC_BYTES)
    is_webp = (
        data[:riff_end] == WEBP_RIFF_MAGIC_BYTES
        and data[fourcc_start:fourcc_end] == WEBP_WEBP_MAGIC_BYTES
    )
    if is_webp:
        return ImageFormat.IMAGE_FORMAT_WEBP

    # No known signature matched.
    return unknown
0 commit comments