LZW Compression 🍬

Karanraj06 · Apr 20, 2023 · 628ac65 · 628ac65
1 parent e369013
commit 628ac65
Show file tree

Hide file tree

Showing 4 changed files with 300 additions and 2 deletions.
diff --git a/Image Compression.pdf b/Image Compression.pdf
diff --git a/LZW Compression.pdf b/LZW Compression.pdf
diff --git a/jpeg_compression.py b/jpeg_compression.py
@@ -439,11 +439,22 @@ def plot_graph(
     plot_images function plots the original and compressed images
     Also, it writes the encoded images to a text file encoded_image.txt
     """
-    # plot_images(*analyze_image("path/to/your/image", 8, 10, color=True))
+    # plot_images(*analyze_image(img_path="path/to/your/image", block_size=8, num_coefficients=10, color=True))
 
     """
     Replaces the images folder with the path to your images folder
     plot_graph function plots the PSNR vs Compression Ratio graph
     for all the images in the images folder for different values of num_coefficients
     """
-    # plot_graph("path/to/your/image/folder", color=False)
+    # plot_graph(img_dir_path="path/to/your/image/folder", color=False)
+
+    if input("Analyze a single image (y/n): ") == "y":
+        img_path = input("Enter the path to the image: ")
+        block_size = int(input("Enter the block size (even): "))
+        num_coefficients = int(input("Enter the number of coefficients passed: "))
+        color = input("Is the image color (y/n): ") == "y"
+        plot_images(*analyze_image(img_path, block_size, num_coefficients, color))
+    elif input("Analyzes all images in a folder (y/n): ") == "y":
+        img_dir_path = input("Enter the path to the images folder: ")
+        color = input("Are the images color (y/n): ") == "y"
+        plot_graph(img_dir_path, color)
diff --git a/lzw_compression.py b/lzw_compression.py
@@ -0,0 +1,287 @@
+# Import the required modules
+import cv2 as cv
+import math
+import matplotlib.pyplot as plt
+import numpy as np
+
+
+def get_compression_ratio(
+    encoded_img: list[list[int]],
+    height: int,
+    width: int,
+    block_size: int,
+    max_dict_size: int,
+) -> float:
+    """
+    Calculates the compression ratio of the encoded image
+
+    The original size is the zero-padded image at 8 bits per pixel. The encoded
+    size assumes every code is stored with one fixed width that can hold the
+    largest dictionary index. lzw_encoder always seeds its dictionary with the
+    256 single-pixel codes, so a code never takes fewer than 8 bits, even when
+    max_dict_size is smaller than 256.
+
+    Parameters:
+        encoded_img (list of LZW encoded blocks): list[list[int]]
+        height (height of the image): int
+        width (width of the image): int
+        block_size (size of the blocks): int
+        max_dict_size (maximum dictionary size): int
+
+    Returns:
+        compression_ratio (compression ratio of the encoded image): float
+
+    Raises:
+        ValueError: if encoded_img contains no codes
+    """
+    # Same fallback as the encoder: an unusable block size becomes the shorter image side
+    if block_size < 1 or block_size > min(height, width):
+        block_size = min(height, width)
+
+    # Calculate the padded height and width of the image
+    padded_height = height + (block_size - height % block_size) % block_size
+    padded_width = width + (block_size - width % block_size) % block_size
+
+    # Calculate the number of bits used in the original image
+    bits_in_original_img = padded_height * padded_width * 8
+
+    # Count the codes emitted over all blocks
+    num_codes = sum(len(block) for block in encoded_img)
+    if num_codes == 0:
+        raise ValueError("encoded_img contains no codes")
+
+    # (n - 1).bit_length() equals ceil(log2(n)) for n >= 1 without floating point;
+    # the floor of 8 covers the 256 codes that are always present
+    bits_per_code = max(8, (int(max_dict_size) - 1).bit_length())
+
+    # Calculate the compression ratio
+    return bits_in_original_img / (num_codes * bits_per_code)
+
+
+def f(img: np.ndarray[np.uint8]) -> tuple[float, float]:
+    """
+    Calculates the entropy and maximum achievable compression of the image
+
+    The entropy is the Shannon entropy (in bits per pixel) of the distribution
+    of pixel values. The maximum achievable compression is 8 / entropy, i.e.
+    the 8 bits stored per pixel divided by the bits per pixel actually needed.
+
+    Parameters:
+        img (grayscale image): np.ndarray[np.uint8]
+
+    Returns:
+        entropy (entropy of the image): float
+        max_compression (maximum achievable compression of the image): float
+            float("inf") when the entropy is zero (e.g. a single-valued image)
+    """
+    # Calculate the number of times each of the unique values comes up in the original image
+    _, counts = np.unique(img, return_counts=True)
+
+    # Normalize the counts into probabilities; every entry is > 0, so log2 is safe
+    probabilities = counts.astype(np.float64) / img.size
+
+    # Calculate the entropy of the image using the probabilities
+    entropy = float(-np.sum(probabilities * np.log2(probabilities)))
+
+    # A constant image yields -0.0 here; dividing by it would give -inf and a
+    # RuntimeWarning, so report the unbounded ratio explicitly instead
+    if entropy <= 0.0:
+        return 0.0, float("inf")
+
+    # Calculate the maximum achievable compression of the image
+    return entropy, 8 / entropy
+
+
+def lzw_encoder(
+    img: np.ndarray[np.uint8], block_size: int, max_dict_size: int
+) -> tuple[list[list[int]], int]:
+    """
+    Compresses a grayscale image block by block with LZW
+
+    The image is zero padded so both dimensions are multiples of the block
+    size, cut into square blocks in row-major order, and every block is
+    encoded independently with a fresh dictionary of the 256 pixel values.
+
+    Parameters:
+        img (grayscale image): np.ndarray[np.uint8]
+        block_size (size of the blocks): int
+        max_dict_size (maximum dictionary size): int
+
+    Returns:
+        encoded_img (list of LZW encoded blocks): list[list[int]]
+        max_dict_filled (maximum dictionary code used): int
+    """
+    rows, cols = img.shape
+    shortest_side = min(rows, cols)
+
+    # An unusable block size falls back to the shorter image side
+    if not 1 <= block_size <= shortest_side:
+        block_size = shortest_side
+
+    # Zero pad up to the next multiple of the block size in each direction
+    padded_rows = rows + (-rows) % block_size
+    padded_cols = cols + (-cols) % block_size
+    canvas = np.zeros((padded_rows, padded_cols), dtype=np.uint8)
+    canvas[:rows, :cols] = img
+
+    encoded_img = []
+    highest_code = 255
+
+    # Visit the blocks row by row, left to right
+    for top in range(0, padded_rows, block_size):
+        for left in range(0, padded_cols, block_size):
+            tile = canvas[top : top + block_size, left : left + block_size]
+
+            # Every block starts from the 256 single-pixel patterns
+            table = {chr(value): value for value in range(256)}
+            codes = []
+            pattern = ""
+            pending_code = None
+
+            for pixel in tile.ravel():
+                symbol = chr(pixel)
+                candidate = pattern + symbol
+
+                # Known pattern: keep extending it and remember its code
+                if candidate in table:
+                    pattern = candidate
+                    pending_code = table[candidate]
+                    continue
+
+                # Unknown pattern: emit the longest known prefix
+                codes.append(pending_code)
+
+                # Learn the new pattern while the dictionary has room
+                if len(table) < max_dict_size:
+                    new_code = len(table)
+                    table[candidate] = new_code
+                    highest_code = max(highest_code, new_code)
+
+                # Restart matching from the pixel that broke the pattern
+                pattern = symbol
+                pending_code = table[symbol]
+
+            # Flush the code of the pattern still being matched
+            codes.append(pending_code)
+            encoded_img.append(codes)
+
+    return encoded_img, highest_code
+
+
+def _lzw_decode_block(codes: list[int], max_dict_size: int) -> list[int]:
+    """
+    Decodes the LZW codes of a single block into its flat list of pixel values
+    """
+    # Every block starts from the 256 single-pixel patterns
+    code_dict = {value: [value] for value in range(256)}
+    decoded_block = []
+
+    # Pattern decoded for the previous code (None before the first code)
+    previous = None
+
+    for code in codes:
+        if code in code_dict:
+            current = code_dict[code]
+        elif previous is not None and code == len(code_dict):
+            # The encoder used a pattern it had only just created; such a
+            # pattern is the previous one followed by its own first pixel
+            current = previous + [previous[0]]
+        else:
+            raise ValueError(f"Invalid LZW code {code}")
+
+        decoded_block.extend(current)
+
+        # Mirror the encoder: after every code but the first, learn the previous
+        # pattern extended by the first pixel of the current one, while there is room
+        if previous is not None and len(code_dict) < max_dict_size:
+            code_dict[len(code_dict)] = previous + [current[0]]
+
+        previous = current
+
+    return decoded_block
+
+
+def lzw_decoder(
+    encoded_img: list[list[int]],
+    height: int,
+    width: int,
+    block_size: int,
+    max_dict_size: int,
+) -> np.ndarray[np.uint8]:
+    """
+    Decodes a grayscale image using LZW compression
+
+    Blocks are expected in row-major order, each encoded independently with a
+    dictionary that starts from the 256 pixel values and grows up to
+    max_dict_size entries.
+
+    Parameters:
+        encoded_img (list of LZW encoded blocks): list[list[int]]
+        height (height of the image): int
+        width (width of the image): int
+        block_size (size of the blocks): int
+        max_dict_size (maximum dictionary size): int
+
+    Returns:
+        decoded_img (decoded image): np.ndarray[np.uint8]
+
+    Raises:
+        ValueError: if a block contains a code that cannot be decoded, or does
+            not decode to exactly block_size * block_size pixels
+    """
+    # Same fallback as the encoder: an unusable block size becomes the shorter image side
+    if block_size < 1 or block_size > min(height, width):
+        block_size = min(height, width)
+
+    # Calculate the padded height and width of the image
+    padded_height = height + (block_size - height % block_size) % block_size
+    padded_width = width + (block_size - width % block_size) % block_size
+
+    # Create a numpy array to store the decoded image
+    decoded_img = np.zeros((padded_height, padded_width), dtype=np.uint8)
+
+    # Index of the encoded block that belongs to the current position
+    counter = 0
+
+    # Iterate over all block positions in row-major order
+    for i in range(0, padded_height, block_size):
+        for j in range(0, padded_width, block_size):
+            decoded_block = _lzw_decode_block(encoded_img[counter], max_dict_size)
+
+            # Reshape the decoded block and store it in the decoded image
+            decoded_img[i : i + block_size, j : j + block_size] = np.array(
+                decoded_block, dtype=np.uint8
+            ).reshape(block_size, block_size)
+
+            # Move on to the next block
+            counter += 1
+
+    # Return the decoded image with the padding cropped away
+    return decoded_img[:height, :width]
+
+
+if __name__ == "__main__":
+    # Read the input image in grayscale
+    img_path = input("Enter the path to the image: ")
+    img = cv.imread(img_path, cv.IMREAD_GRAYSCALE)
+
+    # cv.imread reports an unreadable file by returning None instead of raising
+    if img is None:
+        raise SystemExit(f"Could not read image: {img_path}")
+
+    # Calculate the entropy and maximum achievable compression ratio of the input image
+    entropy, max_compression = f(img)
+
+    # Get the height and width of the input image
+    height, width = img.shape
+
+    # Get the block size for LZW encoding
+    block_size = int(input("Enter the block size: "))
+
+    # Get the maximum dictionary size for LZW encoding
+    max_dict_size = int(input("Enter the maximum dictionary size: "))
+
+    # Encode the input image using LZW encoding and save the encoded data to a file
+    encoded_img, max_dict_filled = lzw_encoder(img, block_size, max_dict_size)
+
+    # The handle is not named f so that the module-level function f stays intact
+    with open("output.txt", "w") as out_file:
+        # Header line: image dimensions and block size, then one line of codes per block
+        out_file.write(f"{height} {width} {block_size}\n")
+        for block in encoded_img:
+            out_file.write(" ".join(map(str, block)) + "\n")
+
+    # Calculate the compression ratio of the encoded image
+    compression_ratio = get_compression_ratio(
+        encoded_img, height, width, block_size, max_dict_size
+    )
+
+    # Decode the encoded image using LZW decoding
+    decoded_img = lzw_decoder(encoded_img, height, width, block_size, max_dict_size)
+
+    # Create a figure with two subplots for the original and decoded images
+    fig, axs = plt.subplots(1, 2, figsize=(10, 5))
+    fig.subplots_adjust(top=0.8)
+
+    # Set the title of the figure
+    fig.suptitle(
+        f"Compression Ratio = {compression_ratio:.2f}, Entropy = {entropy:.2f},\nMax Achievable Compression = {max_compression:.2f}, Maximum Dictionary Code Used = {max_dict_filled}"
+    )
+
+    # Display the original image in the first subplot
+    axs[0].imshow(img, cmap="gray")
+    axs[0].set_title("Original Image")
+
+    # Display the decoded image in the second subplot
+    axs[1].imshow(decoded_img, cmap="gray")
+    axs[1].set_title("Decoded Image")
+
+    # Show the figure
+    plt.show()