Handle file extensions vs PIL format IDs

They usually correspond very closely, like .png -> PNG, but are more distinct for some formats, like .jp2 -> JPEG2000. - Handle formats like JPEG2000 that differ in name from the extension. - Bring my own file ext handling in line with PIL: use dotted lowercase. - Raise an exception when a file format is detected but not supported for reading or for writing, depending on the attempted operation.
2025-01-02 03:48:20 +03:00 · 2023-05-15 14:23:58 -04:00 · 2023-05-15 14:23:58 -04:00 · 9653bfd9d8
commit 9653bfd9d8
parent 1176fcee73
1 changed files with 27 additions and 25 deletions
--- a/src/textual_paint/paint.py
+++ b/src/textual_paint/paint.py
@@ -828,32 +828,31 @@ class AnsiArtDocument:
    def encode_based_on_file_extension(self, file_path: str) -> bytes:
        """Encode the image according to the file extension."""
-        file_type = os.path.splitext(file_path)[1][1:].upper()
+        file_ext_with_dot = os.path.splitext(file_path)[1].lower()
-        print("File extension (normalized to uppercase):", file_type)
+        print("File extension:", file_ext_with_dot)
-        exts = Image.registered_extensions()
+        ext_to_id = Image.registered_extensions() # maps extension to format ID, e.g. '.jp2': 'JPEG2000' (most format IDs are similar to the extension)
-        supported_extensions = [ext[1:].upper() for ext, f in exts.items() if f in Image.SAVE]
        print("Supported image formats by extension:", Image.EXTENSION)
-        print("Supported image formats:", Image.SAVE)
+        print("Supported image formats for writing:", Image.SAVE)
-        print("Supported image format file extensions:", supported_extensions)
+        if file_ext_with_dot == ".svg":
-        if file_type == "SVG":
            return self.get_svg().encode("utf-8")
-        elif file_type == "HTML" or file_type == "HTM":
+        elif file_ext_with_dot == ".html" or file_ext_with_dot == ".htm":
            return self.get_html().encode("utf-8")
-        elif file_type == "TXT":
+        elif file_ext_with_dot == ".txt":
            return self.get_plain().encode("utf-8")
-        elif file_type == "_RICH_CONSOLE_MARKUP":
+        elif file_ext_with_dot == "._rich_console_markup":
            return self.get_rich_console_markup().encode("utf-8")
-        elif file_type in supported_extensions:
+        elif file_ext_with_dot in ext_to_id:
-            return self.encode_image_format(file_type)
+            if ext_to_id[file_ext_with_dot] in Image.SAVE:
+                return self.encode_image_format(ext_to_id[file_ext_with_dot])
+            raise Exception("Image format not supported for writing: " + ext_to_id[file_ext_with_dot])
        else:
-            if file_type not in ["ANS", "NFO"]:
+            if file_ext_with_dot not in [".ans", ".nfo"]:
                print("Falling back to ANSI")
                # TODO: show message to user instead of silently using a different format
                # This is especially important now that we have read-only formats like .CUR
            # This maybe shouldn't use UTF-8...
            return self.get_ansi().encode("utf-8")
-    def encode_image_format(self, file_type: str) -> bytes:
+    def encode_image_format(self, pil_format_id: str) -> bytes:
        """Encode the document as an image file."""
        size = (self.width, self.height)
        image = Image.new("RGB", size, color="#000000")
@@ -863,11 +862,8 @@ class AnsiArtDocument:
            for x in range(self.width):
                color = Color.parse(self.bg[y][x])
                pixels[x, y] = (color.r, color.g, color.b)
-        file_type = file_type.lower()
-        if file_type == "jpg":
-            file_type = "jpeg"
        buffer = io.BytesIO()
-        image.save(buffer, file_type, lossless=True)
+        image.save(buffer, pil_format_id, lossless=True)
        return buffer.getvalue()
    def get_ansi(self) -> str:
@@ -1132,12 +1128,18 @@ class AnsiArtDocument:
    @staticmethod
    def decode_based_on_file_extension(content: bytes, file_path: str, default_bg: str = "#ffffff", default_fg: str = "#000000") -> 'AnsiArtDocument':
        """Creates a document from the given bytes, detecting the file format."""
-        file_type = os.path.splitext(file_path)[1][1:].upper()
+
-        exts = Image.registered_extensions()
+        file_ext_with_dot = os.path.splitext(file_path)[1].lower()
-        supported_extensions = [ext[1:].upper() for ext, f in exts.items() if f in Image.OPEN]
+        print("File extension:", file_ext_with_dot)
-        print("Supported extensions for loading images:", supported_extensions)
+        ext_to_id = Image.registered_extensions() # maps extension to format ID, e.g. '.jp2': 'JPEG2000' (most format IDs are similar to the extension)
-        if file_type in supported_extensions:
+        print("Supported image formats by extension:", Image.EXTENSION)
-            return AnsiArtDocument.from_image_format(content)
+        print("Supported image formats for reading:", Image.OPEN)
+        # TODO: try loading as image first, then as text if that fails with UnidentifiedImageError
+        # That way it can handle images without file extensions.
+        if file_ext_with_dot in ext_to_id:
+            if ext_to_id[file_ext_with_dot] in Image.OPEN:
+                return AnsiArtDocument.from_image_format(content)
+            raise Exception("Image format not supported for reading: " + ext_to_id[file_ext_with_dot])
        else:
            return AnsiArtDocument.from_text(content.decode('utf-8'), default_bg, default_fg)