processing_node.py

import tempfile
import threading
import tempfile
import threading
import cv2
from mpi4py import MPI
from mpi4py import MPI
import numpy as np
from PIL import Image
from utilities import Utilities
from numpy import asarray
import cloudCredentials
import os
import argparse
import time
import io
import base64
from redis_db import redisDB
import os


class ProcessingNode:

    # # a variable to keep track of the number of instances working on the processing node
    # # to update status of processed image to "processed" when all instances are done processing
    # counter = 0
    # lock=threading.Lock()

    def __init__(self, **kwargs):
        self.comm = MPI.COMM_WORLD
        self.size = self.comm.Get_size()
        self.rank = self.comm.Get_rank()
        self.params = kwargs
        self.storage = cloudCredentials.Storage()

    def process_chunk(self, chunk, service_num, **kwargs):
        service_methods = {
            1: ("invert", {}),
            2: ("saturate", {"saturation_scale": kwargs.get("value", 0)}),
            3: ("rgb_to_gray", {}),
            4: ("gray_to_rgb", {}),
            6: (
                "apply_lowpass_filter",
                {
                    "cutoff_frequency": kwargs.get("cutoff_frequency", 1.0),
                    "order": kwargs.get("order", 1),
                },
            ),
            7: (
                "apply_highpass_filter",
                {
                    "cutoff_frequency": kwargs.get("cutoff_frequency", 1.0),
                    "order": kwargs.get("order", 1),
                },
            ),
            8: ("blur_image", {"kernel_size": kwargs.get("kernel_size", 5)}),
            9: ("sharpen_image", {}),
            10: (
                "remove_gaussian_noise",
                {"kernel_size": kwargs.get("kernel_size", 3)},
            ),
            11: (
                "remove_salt_pepper_noise",
                {"kernel_size": kwargs.get("kernel_size", 3)},
            ),
            12: ("sobel_filter", {"kernel_size": kwargs.get("kernel_size", 3)}),
            13: ("prewitt_filter", {}),
            14: ("roberts_filter", {}),
            15: (
                "canny_edge_filter",
                {
                    "threshold1": kwargs.get("threshold1", 50),
                    "threshold2": kwargs.get("threshold2", 150),
                },
            ),
            16: (
                "hough_transform",
                {
                    "rho": kwargs.get("rho", 1),
                    "theta": kwargs.get("theta", np.pi / 180),
                    "threshold": kwargs.get("threshold", 100),
                },
            ),
            17: (
                "harris_corner_detection",
                {
                    "blockSize": kwargs.get("blockSize", 2),
                    "ksize": kwargs.get("ksize", 3),
                    "k": kwargs.get("k", 0.04),
                },
            ),
            18: (
                "binary_threshold",
                {"threshold_value": kwargs.get("threshold_value", 128)},
            ),
            19: ("otsu_threshold", {}),
            20: (
                "gaussian_adaptive_threshold",
                {
                    "block_size": kwargs.get("block_size", 3),
                    "constant": kwargs.get("constant", 0),
                },
            ),
            21: ("apply_lowpass_filter",
                 {
                     "cutoff_frequency": kwargs.get("cutoff_frequency", 50),
                     "order": kwargs.get("order", 2),
                 },),
            22: ("apply_highpass_filter",
                 {
                     "cutoff_frequency": kwargs.get("cutoff_frequency", 50),
                     "order": kwargs.get("order", 2),
                 },),
            23: ("mean_adaptive_threshold",
                 {
                     "block_size": kwargs.get("block_size", 3),
                     "constant": kwargs.get("constant", 0),
                 },
                 ),
            24: ("gaussian_threshold",
                 {"threshold_value": kwargs.get("threshold_value", 128)},
                 ),
        }

        if service_num in service_methods:
            method_name, params = service_methods[service_num]
            method = getattr(Utilities, method_name)
            processed_chunk = method(chunk, **params)
        else:
            raise ValueError(f"Service number {service_num} is not valid.")

        return processed_chunk

    def convert_image_to_array(self, image):
        print(f"IMAGE : {image}")
        try:
            img=None
            img = Image.open(image)
        except Exception as e:
            print(f"Failed to open image: {e}")
            while img is None:
                try:
                    img = Image.open(image)
                except Exception as e:
                    print(f"trying to open image again")
                    time.sleep(0.5)
        img_pixels = asarray(img)
        print(type(img_pixels))
        # print(numpydata)
        print(img_pixels.shape)
        return img_pixels

    def reconstruct_array(self, result_array):
        min_val = np.min([np.min(chunk) for chunk in result_array if chunk is not None])
        max_val = np.max([np.max(chunk) for chunk in result_array if chunk is not None])
        result_array = [
            ((chunk - min_val) * (255 / (max_val - min_val))).astype("uint8")
            for chunk in result_array
            if chunk is not None
        ]
        result_array = np.concatenate(result_array)
        # Convert the array to an imagec
        if len(result_array.shape) == 2:
            image = Image.fromarray(result_array, "L")
        else:
            image = Image.fromarray(result_array, "RGB")
        return image
    
    def remove_overlapping(self,image, overlap, rank):

        if rank == 1:
            piece = image[:-overlap + 1, :]
        elif rank == self.size - 1:
            piece = image[overlap:, :]
        else:
            piece = image[overlap:-overlap + 1, :]
        return piece


    def run(self, task_id, kernel_size=15, service_num=1):
        # with ProcessingNode.lock:
        # ProcessingNode.counter += 1
        # print("COUNTER INTIAL : ", ProcessingNode.counter)
        # print("SIZE : ", self.size)
        # if ProcessingNode.counter == self.size:
        pull_task= redisDB.pull(task_id)
        status=pull_task.get("status")
        #in case a processing node failed , do not change the status , process the image again
        if (status !="In Progress (Processing)"):
            redisDB.update_image_status(task_id, {"status": "In Progress (Processing)",
                                                "link": 'None'})
        # ProcessingNode.counter = 0
        test_r = redisDB.pull(task_id)
        print("PROCESSING STATUS TEST : ", test_r)
        try:
            image = self.storage.get_image(task_id)
        except Exception as e:
            print(f"Failed to retrieve image from Google Cloud Storage: {e}")
            return
        cv2.imwrite(f"original_image.png", image)
        time.sleep(2)
        image_array = self.convert_image_to_array("original_image.png")

        if service_num in [6, 7, 21, 22]:
            # Sequential processing for specified service numbers
            processed_chunk = self.process_chunk(image_array, service_num, **self.params)
            #reconstructed_image = self.reconstruct_array([processed_chunk])
            #reconstructed_image.save("reconstructed_image.png")
            #reconstructed_image = np.array(reconstructed_image)
            time.sleep(0.5)
            try:
                self.storage.upload_image(processed_chunk, task_id)
            except Exception as e:
                    print(f"Failed to upload image to Google Cloud Storage: {e}")
                    while processed_chunk is None:
                        try:
                            self.storage.upload_image(processed_chunk, task_id)
                            print(f"trying to upload image again"+task_id)
                        except Exception as e:
                            time.sleep(0.5)
            time.sleep(0.5)
            try:
                img_link = self.storage.create_signed_url(task_id)
            except Exception as e:
                print(f"Failed to create signed URL: {e}")
                while img_link is None:
                    try:
                        img_link = self.storage.create_signed_url(task_id)
                    except Exception as e:
                        print(f"Failed to create signed URL: {e}")
                        time.sleep(0.5)            
            redisDB.update_image_status(task_id, {"status": "Processed",
                                                  "link": img_link})
            test_r = redisDB.pull(task_id)
            print("PROCESSED STATUS TEST : ", test_r)
        else:
            chunk_size_row = image_array.shape[0] // (self.size - 1)
            chunk_size_col = image_array.shape[1]
            num_channels = image_array.shape[2]
            print(f"Chunk num of channels: {num_channels}")
            chunk_size = (chunk_size_row, chunk_size_col, num_channels)
            overlap = kernel_size // 2
            print("overlap : ", overlap)
            if self.rank == 0:
                # with ProcessingNode.lock:
                # print("COUNTER modified by rank 0: ", ProcessingNode.counter)
                # ProcessingNode.counter += 1
                recv_chunks = []
                for i in range(1, self.size):
                    # Determine the slice indices
                    start_row = (chunk_size_row) * (i - 1)
                    end_row = (chunk_size_row) * i
                    print(f"Chunk size_{i}_BEFORE : ", start_row , " " , end_row, "total: ",end_row-start_row+1)
                    if i > 1:
                        start_row -= overlap
                        # print(f"{i} Entered IF 1")
                    if i < self.size - 1:
                        # print(f"{i} Entered IF 2")
                        # print("MY RANK @ END", self.comm.rank)
                        end_row += overlap
                    print("---------- i  : ", i, "start : ", start_row, "end :", end_row,"total: ",end_row-start_row+1)
                    # Extract chunk to be sent to worker
                    chunk = image_array[start_row:end_row, :, :]
                    print(f"Chunk size_{i}_AFTER : ", chunk.shape)
                    # Save the chunk as an image
                    cv2.imwrite(f"chunk_{i}.png", chunk)
                    # Scatter chunk to workers
                    self.comm.send(chunk, dest=i, tag=0)

                for i in range(1, self.size):
                    # Gather processed chunks from workers
                    processed_chunk = self.comm.recv(source=i, tag=0)
                    if kernel_size != 0:
                        if self.rank == 1:
                            processed_chunk = self.remove_overlapping(processed_chunk, overlap, self.rank)
                        elif self.rank == self.rank - 1:
                            processed_chunk = self.remove_overlapping(processed_chunk, overlap, self.rank)
                        else:
                            processed_chunk = self.remove_overlapping(processed_chunk,overlap,self.rank)
                    recv_chunks.append(processed_chunk)
                # Reconstruct using the received chunks
                reconstructed_image = self.reconstruct_array(recv_chunks)
                reconstructed_image.save("reconstructed_image.png")

                # Upload the reconstructed image to Google Cloud Storage
                reconstructed_image = np.array(reconstructed_image)
                time.sleep(0.5)
                try:
                    self.storage.upload_image(reconstructed_image, task_id)
                except Exception as e:
                    print(f"Failed to upload image to Google Cloud Storage: {e}")
                    while reconstructed_image is None:
                        try:
                            self.storage.upload_image(reconstructed_image, task_id)
                            print(f"trying to upload image again"+task_id)
                        except Exception as e:
                            time.sleep(0.5)
                time.sleep(0.5)
                try:
                    img_link = self.storage.create_signed_url(task_id)
                except Exception as e:
                    print(f"Failed to create signed URL: {e}")
                    while img_link is None:
                        try:
                            img_link = self.storage.create_signed_url(task_id)
                        except Exception as e:
                            print(f"Failed to create signed URL: {e}")
                            time.sleep(0.5)
                # with ProcessingNode.lock:
                # print("COUNTER : ", ProcessingNode.counter)
                # if ProcessingNode.counter == self.size:

                redisDB.update_image_status(task_id, {"status": "Processed",
                                                      "link": img_link})
                test_r = redisDB.pull(task_id)
                print("PROCESSED STATUS TEST : ", test_r)
                #os.remove("original_image.png")
                # return reconstructed_image
            else:
                # with ProcessingNode.lock:
                # ProcessingNode.counter += 1
                chunk = self.comm.recv(source=0, tag=0)
                cv2.imwrite(f"recived_chunk_{self.comm.rank}.png", chunk)
                # chunk = image_array[start_row:end_row, :, :]
                processed_chunk = self.process_chunk(chunk, service_num, **self.params)
                # Convert data type if necessary
                if processed_chunk.dtype != np.uint8:
                    processed_chunk = processed_chunk.astype(np.uint8)
                    print(f"Data type after conversion: {processed_chunk.dtype}")
                print(f"Processed chunk shape: {processed_chunk.shape}")
                # Save the processed_chunk array as an image using OpenCV
                cv2.imwrite("processed_chunk.png", processed_chunk)
                # Gather processed chunks on rank 0
                self.comm.send(processed_chunk, dest=0, tag=0)


if __name__ == "__main__":
    # Initialize the ProcessingNode with any required parameters
    parser = argparse.ArgumentParser(description='Process some integers.')
    parser.add_argument('task_id', type=str, help='Task ID')
    parser.add_argument('service_num', type=int, help='Service number')

    args = parser.parse_args()

    node = ProcessingNode()
    node.run(task_id=args.task_id, service_num=args.service_num)
    # Define the path to your test image
    # test_image_path = 'icon.png'
    # image = cv2.imread(test_image_path)

    # Define the service number for the image processing task
    # service_num = 6
    # task_id = 1
    node = ProcessingNode()
    node.run(task_id=args.task_id, service_num=args.service_num)