MTE.py

"""
    Server side to catch a camera stream from a client
"""

import os
import math

import argparse
import csv
import json
import time
from datetime import datetime
import cv2
import numpy as np

from pykson import Pykson
from imutils.video import FPS
import imagezmq
from zmq.error import ZMQError

from Domain.MTEMode import MTEMode
from Domain.ErrorLearning import ErrorLearning
from Domain.ErrorRecognition import ErrorRecognition
from Domain.ErrorInitialize import ErrorInitialize
from Domain.MTEAlgo import MTEAlgo
from Domain.LearningData import LearningData
from Domain.MTEResponse import MTEResponse
from Domain.MTEThreshold import MTEThreshold
from Domain.RecognitionData import RecognitionData
from Domain.ResponseData import ResponseData
from Domain.UserInformation import UserInformation
from Repository import Repository

from MLValidation import MLValidation
from SIFTEngine import SIFTEngine
from VCLikeEngine import VCLikeEngine

# CAM_MATRIX = np.array([[954.16160543, 0., 635.29854945], \
#     [0., 951.09864051, 359.47108905],  \
#         [0., 0., 1.]])

SAMPLE_FOLDER = "samples"

class MTE:
    """
    This class initializes a server that will listen to client
    and will compute motion tracking for the client.
    """

    def __init__(self, mte_algo=MTEAlgo.SIFT_KNN, crop_margin=1.0/6, resize_width=380, \
         ransacount=300, disable_blur=False, disable_centering=False, one_shot_mode=False, \
         disable_histogram_matching=False, debug_mode=False):
        print("Launching server")
        self.image_hub = imagezmq.ImageHub()
        self.image_hub.zmq_socket.RCVTIMEO = -1
        # self.image_hub = imagezmq.ImageHub(open_port='tcp://192.168.43.39:5555')

        self.repo = Repository()

        self.learning_db = []
        self.last_learning_data = None

        # ML validation
        self.ml_validator = MLValidation()

        self.format_resolution = None
        self.width_small = None
        self.width_medium = None
        self.width_large = None

        # Motion tracking engines
        self.mte_algo = mte_algo
        self.crop_margin = crop_margin
        self.resize_width = resize_width
        self.resize_height = int(resize_width*(1/(16/9)))
        self.validation_width = None
        self.validation_height = None
        self.disable_histogram_matching = disable_histogram_matching

        self.debug_mode = debug_mode

        if self.mte_algo == MTEAlgo.VC_LIKE:
            self.vc_like_engine = VCLikeEngine(one_shot_mode=one_shot_mode, \
                disable_histogram_matching = disable_histogram_matching, debug_mode=self.debug_mode)
        else:
            self.sift_engine = SIFTEngine(maxRansac=ransacount)

        self.threshold_small = MTEThreshold(100, 45, 3500, 1100, 12000, 4000, 13000)
        self.threshold_medium = MTEThreshold(100, 70, 3400, 1200, 14000, 5000, 18000)
        self.threshold_large = MTEThreshold(3500, 180, 3100, 750, 13000, 5500, 20000)

        self.rollback = 0
        self.orange_count_for_rollback = 0
        self.validation = 0
        self.devicetype = "CPU"
        self.resolution_change_allowed = 3

        self.reference = LearningData()

        self.debug = None
        self.server_csv = None
        self.result_csv = None

        self.disable_centering = disable_centering

        self.disable_blur = disable_blur
        if disable_blur:
            self.min_validation_count = 3
        else:
            self.min_validation_count = 5

        self.landscape_image = True

    def init_server_csv(self):
        """ This function create a log for the global activity of the server."""
        
        if not os.path.exists("logs_server"):
            os.makedirs("logs_server")
        log_location = os.path.join("logs_server", datetime.now().strftime("%m%d%Y_%H%M%S"))
        self.server_csv = open(log_location+'.csv', 'w')
        metrics = ['Timestamp', 'Action', 'Ref Client']
        writer = csv.DictWriter(self.server_csv, fieldnames=metrics)
        writer.writeheader()
        return writer

    def fill_server_log(self, writer, action, ref):
        """This function fill server's logs."""

        writer.writerow({'Timestamp' : datetime.now(),
                         'Action' : action,
                         'Ref Client': ref})

    def init_log(self, name):
        """ This function creates and initializes a writer.

        In : name -> String being the name of the csv file that will be created, can be a path
        Out : Writer object pointing to name.csv
        """
        self.result_csv = open(name+'.csv', 'w')
        metrics = ['Success', 'Flag', 'Code', 'Direction', 
                   'Number of keypoints', 'Number of matches',
                   'Distance Kirsh', 'Distance Canny', 'Distance Color',
                   'Translation x', 'Translation y',
                   'Scale x', 'Scale y',
                   'Blurred']
        writer = csv.DictWriter(self.result_csv, fieldnames=metrics)
        writer.writeheader()
        return writer

    def fill_log(self, writer, recognition, response, is_blurred):
        """ This function fill a csv files with the data set as input.

        In :    writer -> Object pointing to the csv file
                recognition -> results of the recognition
                response -> data that will be sent to client
                is blurred -> is the current image blurred
        """
        if self.result_csv is not None:
            if not isinstance(recognition.dist_roi, int):
                distance_kirsh = recognition.dist_roi[0]
                distance_canny = recognition.dist_roi[1]
                distance_color = recognition.dist_roi[2]
            else:
                distance_kirsh = ""
                distance_canny = ""
                distance_color = ""

            writer.writerow({'Success' : recognition.success,
                             'Number of keypoints' : recognition.nb_kp,
                             'Number of matches': recognition.nb_match,
                             'Distance Kirsh' : distance_kirsh,
                             'Distance Canny' : distance_canny,
                             'Distance Color' : distance_color,
                             'Translation x' : recognition.translations[0],
                             'Translation y' : recognition.translations[1],
                             'Scale x' : recognition.scales[0],
                             'Scale y' : recognition.scales[1],
                             'Flag' : response.flag,
                             'Code' : response.status,
                             'Direction' : response.user_information,
                             'Blurred' : is_blurred})

    def create_log(self):
        log_location = os.path.join("logs", "ref"+str(self.reference.id_ref))
        if not os.path.exists(log_location):
            os.makedirs(log_location)
        log_name = datetime.now().strftime("%m%d%Y_%H%M%S")
        log_path = os.path.join(log_location, log_name)
        log_writer = self.init_log(log_path)
        
        return log_writer

    def set_mte_parameters(self, ratio):
        """Edit values for globals parameters of the motion tracking engine."""

        if math.isclose(ratio, 16/9, rel_tol=1e-5):
            self.width_small = 400
            self.width_medium = 660
            self.width_large = 1730
            self.format_resolution = 16/9
        elif math.isclose(ratio, 4/3, rel_tol=1e-5):
            self.width_small = 350
            self.width_medium = 570
            self.width_large = 1730
            self.format_resolution = 4/3
        else:
            print("What kind of format is that ?")
            return False

        self.validation_width = self.width_small
        self.validation_height = int(self.validation_width*(1/self.format_resolution))
        if self.mte_algo in (MTEAlgo.SIFT_KNN, MTEAlgo.SIFT_RANSAC):
            self.sift_engine.set_parameters(self.width_small, self.width_medium,\
                                            self.width_large, self.format_resolution)
        elif self.mte_algo == MTEAlgo.VC_LIKE:
            self.vc_like_engine.set_parameters(self.format_resolution)

        return True

    def listen_images(self):
        """Receive a frame and an action from client then compute required operation

        The behaviour depend of the mode send : PRELEARNING/LEARNING/RECOGNITION
        This function has no proper value to return but will send a message to the client
        containing the operations' results.
        """

        server_log_writter = self.init_server_csv()
        while True:  # show streamed images until Ctrl-C
            msg, raw_image = self.image_hub.recv_image()

            data = json.loads(msg)

            if raw_image is None or not isinstance(raw_image, np.ndarray) or \
                "error" in data and data["error"] or \
                    "mode" not in data:
                # print("<<<<<<<<<<<<<<<<<< Error receiving garbage >>>>>>>>>>>>>>>>>>")
                data["mode"] = MTEMode.NEUTRAL.value
            
            else:
                h, w = raw_image.shape[:2]
                if h > w:
                    self.landscape_image = False
                    image = cv2.rotate(raw_image, cv2.ROTATE_90_CLOCKWISE)
                else:
                    self.landscape_image = True
                    image = raw_image

            if self.mte_algo == MTEAlgo.VC_LIKE and MTEMode(data["mode"]) != MTEMode.NEUTRAL:
                h, w = image.shape[:2]
                if math.isclose(float(w)/h, 4/3, rel_tol=1e-5):
                    new_h = int(w * (1 / (16 / 9)))
                    limits = int((h - new_h) / 2)
                    croped = image[int(limits): int(h-limits), \
                        0: w]
                    image = croped.copy()

            if MTEMode(data["mode"]) == MTEMode.VALIDATION_REFERENCE:
                t0 = time.time()
                self.rollback = 0
                self.validation = 0
                self.resolution_change_allowed = 3
                resolution_valid = self.set_mte_parameters(image.shape[1]/image.shape[0])
                t1 = time.time()
                if resolution_valid:
                    status = self.learning(image)
                    to_send = {
                        "status": status.value,
                        "mte_parameters": {}
                    }
                    # self.reference.mte_parameters["ratio"] = self.format_resolution
                    if status == ErrorLearning.SUCCESS:
                        to_send["mte_parameters"] = self.reference.change_parameters_type_for_sending()
                
                        # Samples
                        if not os.path.exists(SAMPLE_FOLDER):
                            os.makedirs(SAMPLE_FOLDER)

                        if not os.path.exists(os.path.join(SAMPLE_FOLDER, str(self.reference.id_ref))):
                            os.makedirs(os.path.join(SAMPLE_FOLDER, str(self.reference.id_ref)))
                        
                        cv2.imwrite(os.path.join(SAMPLE_FOLDER, str(self.reference.id_ref), "Ref.png"), raw_image)
                else:
                    print("Invalid format.")
                    to_send = {
                        "status" : ErrorLearning.INVALID_FORMAT.value
                    }

                # Cleaning
                self.reference.clean_control_assist(self.reference.id_ref)
                data["id_ref"] = None
                t2 = time.time()
                # print("<<<<<<<<<<<<<<<< Calcul = {}, Change = {}, Total = {} >>>>>>>>>>>".format(t1-t0, t2-t1, t2-t0))

            elif MTEMode(data["mode"]) == MTEMode.INITIALIZE_MTE:
                if data["mte_parameters"]["ratio"] is None:
                    to_send = {
                        "status" : ErrorInitialize.ERROR.value
                    }
                    print("Error inside parameters for init.")
                # elif (not self.reference.is_empty()) and self.reference.id_ref != data["id_ref"]:
                #     to_send = {
                #         "status" : ErrorInitialize.NEED_TO_CLEAR_MTE.value
                #     }
                #     print("Engine already initialized with a different ref.")
                #     # Pas de retour d'id car MTEMode.CLEAR_MTE s'en occupe
                else:
                    # Clear MTE 
                    self.clear_mte()

                    # Initialize MTE
                    self.rollback = 0
                    self.validation = 0
                    self.resolution_change_allowed = 3
                    self.orange_count_for_rollback = 0
                    self.format_resolution = data["mte_parameters"]["ratio"]
                    self.set_mte_parameters(self.format_resolution)
                    init_status = self.reference.initialiaze_control_assist\
                        (data["id_ref"], data["mte_parameters"])
                    
                    if self.mte_algo == MTEAlgo.VC_LIKE:
                        self.vc_like_engine.init_engine(self.reference)

                    if init_status == 0:
                        log_writer = self.create_log()
                    if os.path.isfile('temporaryData.txt'):
                        os.remove('temporaryData.txt')
                    with open('temporaryData.txt', 'w') as json_file:
                        to_save_parameters = self.reference.change_parameters_type_for_sending()
                        to_save = {
                            "id_ref" : data["id_ref"],
                            "mte_parameters" : to_save_parameters
                        }
                        json.dump(to_save, json_file)

                    to_send = {
                        "status" : init_status
                    }
                    if self.mte_algo != MTEAlgo.VC_LIKE:
                        target = (self.width_medium, \
                                int(self.width_medium*(1/self.format_resolution)))
                    else:
                        target = (self.vc_like_engine.image_width, \
                            self.vc_like_engine.image_height)

            elif MTEMode(data["mode"]) == MTEMode.MOTION_TRACKING:
                if (self.reference.id_ref is None) and (os.path.isfile('temporaryData.txt')):
                    print("Restoring data from temporaryData.")
                    with open('temporaryData.txt') as json_file:
                        data_restored = json.load(json_file)
                        self.format_resolution = data_restored["mte_parameters"]["ratio"]
                        self.set_mte_parameters(self.format_resolution)
                        self.reference.initialiaze_control_assist(data_restored["id_ref"], data_restored["mte_parameters"])
                        
                        if self.mte_algo == MTEAlgo.VC_LIKE:
                            self.vc_like_engine.init_engine(self.reference)
                        
                        log_writer = self.create_log()
                        data = data_restored
                        data["mode"] = MTEMode.MOTION_TRACKING
                    target = (self.width_medium, \
                            int(self.width_medium*(1/self.format_resolution)))
                if self.reference.id_ref is None:
                    print("Engine is not initialized.")
                    to_send = {
                        "status" : ErrorRecognition.ENGINE_IS_NOT_INITIALIZED.value
                    }
                elif data["id_ref"] != self.reference.id_ref:
                    print("Wrong initialization.")
                    to_send = {
                        "status" : ErrorRecognition.MISMATCH_REF.value
                    }
                else:
                    self.debug = image.copy()
                    if self.devicetype == "CPU" and image.shape[1] > self.width_medium:
                        image = cv2.resize(image, target,\
                                 interpolation=cv2.INTER_AREA)

                    results = self.recognition(image)
                    if self.mte_algo == MTEAlgo.VC_LIKE:
                        response_type = results[-1]
                        results = RecognitionData(*results[:-1])
                    else:
                        results = RecognitionData(*results)

                    if self.mte_algo == MTEAlgo.VC_LIKE:
                        response = self.behaviour_vc_like_engine(results, response_type)
                    elif image.shape[1] == self.width_small:
                        response = self.behaviour_width_small(results)
                    elif image.shape[1] == self.width_medium:
                        response = self.behaviour_width_medium(results)
                    elif image.shape[1] == self.width_large:
                        response = self.behaviour_width_large(results)
                    else:
                        print("Image size not supported.")
                        response = ResponseData(\
                                                [self.width_small,\
                                                self.width_small*(1/self.format_resolution)],\
                                                MTEResponse.RED, 0, 0, UserInformation.CENTERED, \
                                                0, 0, ErrorRecognition.MISMATCH_SIZE_WITH_REF)

                    # If we can capture
                    is_blurred = False
                    if self.validation > self.min_validation_count:
                        self.validation = self.min_validation_count
                    if self.validation == self.min_validation_count:
                        is_blurred = self.is_image_blurred(image, \
                            size=int(response.requested_image_size[0]/18))
                        # if the image is not blurred else we just return green
                        if self.disable_blur:
                            if response.user_information == UserInformation.CENTERED:
                                response.flag = MTEResponse.CAPTURE
                        else:
                            if not is_blurred[1] and response.user_information == UserInformation.CENTERED:
                                response.flag = MTEResponse.CAPTURE
                    temp_x = response.target_data["translations"][0]
                    temp_y = response.target_data["translations"][1]
                    if temp_x is not None and temp_y is not None:
                        response.target_data["translations"] = (temp_x * (self.debug.shape[1]/target[0]), temp_y * (self.debug.shape[0]/target[1]))
                    to_send = response.to_dict()
                    self.fill_log(log_writer, results, response, is_blurred)
                    target = (response.requested_image_size[0], response.requested_image_size[1])

                    target = (response.requested_image_size[0], response.requested_image_size[1])

                    
                    # Samples
                    cv2.imwrite(os.path.join(SAMPLE_FOLDER, str(self.reference.id_ref), str(time.time()) + ".png"), raw_image)

            elif MTEMode(data["mode"]) == MTEMode.CLEAR_MTE :
                if "id_ref" in data and data["id_ref"] is not None:
                    status, id_ref = self.clear_mte(data["id_ref"])
                    to_send = {
                        "status" : status,
                        "id_ref" : id_ref
                    }
                else:
                    print("No reference id provided.")
                    to_send = {
                        "status" : 1
                    }
                
            elif MTEMode(data["mode"]) == MTEMode.FORCE_CLEAR_MTE:
                status, _ = self.clear_mte()
                to_send = {
                    "status" : status
                }
            elif MTEMode(data["mode"]) == MTEMode.RUNNING_VERIFICATION:
                to_send = {
                    "status" : 0
                }
            else:
                # Impossible
                to_send = {
                    "status" : 1
                }
                print("An error occured.")

            if "id_ref" in data:
                self.fill_server_log(server_log_writter, MTEMode(data["mode"]), \
                    data["id_ref"])

            try:
                self.image_hub.send_reply(json.dumps(to_send).encode())
            except ZMQError:
                # Timeout reached
                continue
    
    def clear_mte(self, id_ref=None):
        status = self.reference.clean_control_assist(id_ref)

        if status != 0:
            id_ref = self.reference.id_ref
            print("Clean failed, wrong reference id.")
        else:
            if os.path.isfile('temporaryData.txt'):
                os.remove('temporaryData.txt')

            id_ref = -1
            self.rollback = 0
            self.validation = 0
            self.resolution_change_allowed = 3
            self.orange_count_for_rollback = 0

            if self.result_csv is not None:
                self.result_csv = self.result_csv.close()

            print("Clean success.")

        return status, id_ref

    def is_image_blurred(self, image, size=60, thresh=10):
        """Check if an image is blurred. Return a tuple (mean: float, blurred: bool)

        Keyword arguments:
        image -> the image to test as array
        size -> the radius size around the center that will be used in FFTShift (default 60)
        thresh -> the threshold value for the magnitude comparaison (default 15)
        """

        # cv2.imshow("Input image", image)

        mean, is_blurred = self.is_blurred_fft(image, size, thresh)
        # mean, is_blurred = self.is_blurred_laplacian(image, thresh)

        return mean, is_blurred
    
    def is_blurred_fft(self, image, size=60, thresh=10):
        # Histogram equalization
        hist, bins = np.histogram(image.flatten(), 256, [0,256])
        cdf = hist.cumsum()

        cdf_m = np.ma.masked_equal(cdf, 0)
        cdf_m = (cdf_m - cdf_m.min())*255 / (cdf_m.max() - cdf_m.min())
        cdf = np.ma.filled(cdf_m, 0).astype('uint8')

        equalized_image = cdf[image]

        # cv2.imshow("Equalized image", equalized_image)

        (height, width, _) = equalized_image.shape
        (center_x, center_y) = (int(width / 2.0), int(height / 2.0))
        fft = np.fft.fft2(equalized_image)
        fft_shift = np.fft.fftshift(fft)
        fft_shift[center_y - size:center_y + size, center_x - size:center_x + size] = 0
        fft_shift = np.fft.ifftshift(fft_shift)
        recon = np.fft.ifft2(fft_shift)
        magnitude = 20 * np.log(np.abs(recon))
        mean = np.mean(magnitude)

        # cv2.waitKey(0)

        return (mean, mean <= thresh)
    
    def is_blurred_laplacian(self, image, thresh=10):
        score = cv2.Laplacian(image, cv2.CV_64F).var()
        grey_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        contrast = grey_image.std()

        return (score, score <= thresh)

    def compute_direction(self, translation_value, scale_value, size_w):
        """Return a string representing a cardinal direction.

        Keyword arguments:
        translation -> tuple containing homographic estimations of x,y
        size_w -> the width of the current image
        """
        if self.disable_centering:
            divider = 50
        else:
            divider = 10

        tolerance = float(divider)/100
        size_h = int(size_w*(1/self.format_resolution))

        if not self.landscape_image:
            temp = size_w
            size_w = size_h
            size_h = temp

        center = (translation_value[0]*scale_value[0]+size_w/2, \
            translation_value[1]*scale_value[1]+int(size_h/2))

        direction = UserInformation.CENTERED


        if center[1] < (size_h/2 - size_w*tolerance):
            if center[0] < (size_w/2 - size_w*tolerance):
                direction = UserInformation.UP_LEFT
            elif center[0] > (size_w/2 + size_w*tolerance):
                direction = UserInformation.UP_RIGHT
            else:
                if center[1] < (size_h/2 - size_w*tolerance*2):
                    direction = UserInformation.BIG_UP
                else:
                    direction = UserInformation.UP

        elif center[1] > (size_h/2 + size_w*tolerance):
            if center[0] < (size_w/2 - size_w*tolerance):
                direction = UserInformation.DOWN_LEFT
            elif center[0] > (size_w/2 + size_w*tolerance):
                direction = UserInformation.DOWN_RIGHT
            else:
                if center[1] > (size_h/2 + size_w*tolerance*2):
                    direction = UserInformation.BIG_DOWN
                else:
                    direction = UserInformation.DOWN

        else:
            if center[0] < (size_w/2 - size_w*tolerance*2):
                direction = UserInformation.BIG_LEFT
            elif center[0] < (size_w/2 - size_w*tolerance):
                direction = UserInformation.LEFT
            elif center[0] > (size_w/2 + size_w*tolerance*2):
                direction = UserInformation.BIG_RIGHT
            elif center[0] > (size_w/2 + size_w*tolerance):
                direction = UserInformation.RIGHT
            else:
                direction = UserInformation.CENTERED

        # center_kp = cv2.KeyPoint(center[0], center[1], 8)
        # to_draw = cv2.drawKeypoints(self.debug, [center_kp], \
        # np.array([]), (255, 0, 0), cv2.DRAW_MATCHES_FLAGS_DRAW_RICH_KEYPOINTS)
        # cv2.imshow("Direction", to_draw)
        # cv2.waitKey(1)
        return direction
    
    def behaviour_vc_like_engine(self, results, response_type):
        direction = self.compute_direction(results.translations, results.scales, self.vc_like_engine.image_width)
        
        if response_type == MTEResponse.CAPTURE and direction != UserInformation.CENTERED:
            response_type = MTEResponse.GREEN

        response = ResponseData(\
                                [self.vc_like_engine.image_width,\
                                self.vc_like_engine.image_height],\
                                response_type, results.translations[0], results.translations[1], \
                                direction, \
                                results.scales[0], results.scales[1], ErrorRecognition.SUCCESS)
        
        return response

    def red_width_small(self):
        """Critical recognition behaviour for an image (_, 380).
        Return a ResponseData and change global variables.
        """

        width = self.width_small
        self.rollback += 1
        if self.validation > 0:
            self.validation -= 1
        if self.rollback >= 5:
            self.rollback = 0
            width = self.width_medium
        return ResponseData([width, int(width*(1/self.format_resolution))],\
             MTEResponse.RED, None, None, None, None, None)

    def orange_behaviour(self, results, width):
        """Uncertain recognition behaviour.
        Return a ResponseData and change global variables.

        Keyword arguments:
        results -> the RecognitionData
        size -> the width of the image
        """

        new_width = width
        if self.validation > 0:
            self.validation -= 1
        if width == self.width_small and self.orange_count_for_rollback >= 2:
            new_width = self.width_medium
            self.orange_count_for_rollback = 0
            self.resolution_change_allowed -= 1
        elif width == self.width_small:
            self.orange_count_for_rollback += 1

        return ResponseData([new_width, int(new_width*(1/self.format_resolution))], MTEResponse.ORANGE,\
                            results.translations[0], results.translations[1], \
                            self.compute_direction(results.translations, results.scales, width), \
                            results.scales[0], results.scales[1])

    def red_width_medium(self):
        """Critical recognition behaviour for an image (_, 640).
        Return a ResponseData and change global variables.
        """

        width = self.width_medium
        msg = MTEResponse.RED
        if self.devicetype == "CPU":
            self.validation = 0
            msg = MTEResponse.TARGET_LOST
        else:
            self.rollback += 1
            if self.rollback >= 5:
                width = self.width_large
                self.rollback = 0
        return ResponseData([width, int(width*(1/self.format_resolution))],\
             msg, None, None, None, None, None)

    def green_width_medium(self, results):
        """Behaviour for an image (_, 640) when the flag turns on to be green.
        Return a ResponseData and change global variable.

        Keyword arguments:
        results -> the RecognitionData
        """

        width = self.width_medium
        if self.resolution_change_allowed > 0:
            self.resolution_change_allowed -= 1
            width = self.width_small
            self.validation = 0
            self.rollback = 0
            self.orange_count_for_rollback = 0
        else:
            self.validation += 1
        return ResponseData(\
            [width, int(width*(1/self.format_resolution))],\
            MTEResponse.GREEN,\
            results.translations[0], results.translations[1],\
            self.compute_direction(results.translations,\
                results.scales, self.width_medium), \
            results.scales[0], results.scales[1])

    def lost_width_large(self):
        """Behaviour for a image (_, 1730) when the target is lost
        Return a ResponseData.
        """

        msg = MTEResponse.TARGET_LOST
        return ResponseData([self.width_large, int(self.width_large*(1/self.format_resolution))],\
             msg, None, None, None, None, None)

    def behaviour_width_small(self, results):
        """Global behaviour for recognition of image (_,380).
        Based on the activity diagram.
        Return a ResponseData.

        Keyword arguments:
        results -> the RecognitionData
        """

        response = MTEResponse.RED
        # If not enough keypoints
        if results.nb_kp < self.threshold_small.nb_kp:
            response_for_client = self.red_width_small()
            response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_KEYPOINTS)
        # If not enough matches
        elif results.nb_match < self.threshold_small.nb_match:
            # If homography doesn't even start
            if results.nb_match < 30:
                response_for_client = self.red_width_small()
                response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_MATCH_CRITICAL)
            else:
                response_for_client = self.orange_behaviour(results, self.width_small)
                response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_MATCH)
        else:
            response = MTEResponse.GREEN
            # If not centered with target
            if not results.success:
                self.validation = 0
                response_for_client = ResponseData(\
                                [self.width_small,\
                                int(self.width_small*(1/self.format_resolution))],\
                                response,\
                                results.translations[0], results.translations[1], \
                                self.compute_direction(results.translations,\
                                    results.scales, self.width_small), \
                                results.scales[0], results.scales[1],\
                                status=ErrorRecognition.WRONG_POINT_OF_VIEW)
            else:
                dist_kirsh = results.dist_roi[0] < self.threshold_small.mean_kirsh
                dist_canny = results.dist_roi[1] < self.threshold_small.mean_canny
                dist_color = results.dist_roi[2] < self.threshold_small.mean_color
                # If 0 or 1 mean valid
                if int(dist_kirsh)+int(dist_canny)+int(dist_color) < 2:
                    response_for_client = self.orange_behaviour(results, self.width_small)
                    response_for_client.set_status(ErrorRecognition.MEANS_OUT_OF_LIMITS)
                else:
                    dist_kirsh = results.dist_roi[0] < self.threshold_small.kirsh_aberration
                    dist_color = results.dist_roi[2] < self.threshold_small.color_aberration
                    # If no aberration
                    if int(dist_kirsh)+int(dist_color) == 2:
                        self.validation += 1
                        self.rollback = 0
                        status = ErrorRecognition.SUCCESS
                    else:
                        response = MTEResponse.ORANGE
                        status = ErrorRecognition.ABERRATION_VALUE
                    response_for_client = ResponseData(\
                        [self.width_small, int(self.width_small*(1/self.format_resolution))],\
                        response,\
                        results.translations[0], results.translations[1], \
                        self.compute_direction(results.translations, \
                            results.scales, self.width_small), \
                        results.scales[0], results.scales[1], status=status)

        if response_for_client.flag == MTEResponse.GREEN:
            self.rollback = 0
        return response_for_client

    def behaviour_width_medium(self, results):
        """Global behaviour for recognition of image (_,640).
        Based on the activity diagram.
        Return a ResponseData.

        Keyword arguments:
        results -> the RecognitionData
        """

        if results.nb_kp < self.threshold_medium.nb_kp:
            response_for_client = self.red_width_medium()
            response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_KEYPOINTS)
        # If not enough matches
        elif results.nb_match < self.threshold_medium.nb_match:
            # If homography doesn't even start
            if results.nb_match < 30:
                response_for_client = self.red_width_medium()
                response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_MATCH_CRITICAL)
            else:
                response_for_client = self.orange_behaviour(results, self.width_medium)
                response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_MATCH)
        else:
            response = MTEResponse.GREEN
            # If not centered with target
            if not results.success:
                response_for_client = ResponseData([self.width_medium,\
                    int(self.width_medium*(1/self.format_resolution))], response,\
                    results.translations[0], results.translations[1], \
                    self.compute_direction(results.translations,\
                        results.scales, self.width_medium), \
                    results.scales[0], results.scales[1],\
                    status=ErrorRecognition.WRONG_POINT_OF_VIEW)
            else:
                dist_kirsh = results.dist_roi[0] < self.threshold_medium.mean_kirsh
                dist_canny = results.dist_roi[1] < self.threshold_medium.mean_canny
                dist_color = results.dist_roi[2] < self.threshold_medium.mean_color
                # If 0 or 1 mean valid
                if int(dist_kirsh)+int(dist_canny)+int(dist_color) < 2:
                    response_for_client = self.orange_behaviour(results, self.width_medium)
                    response_for_client.set_status(ErrorRecognition.MEANS_OUT_OF_LIMITS)
                # If all means are valids
                elif int(dist_kirsh)+int(dist_canny)+int(dist_color) == 3:
                    response_for_client = self.green_width_medium(results)
                    response_for_client.set_status(ErrorRecognition.SUCCESS)
                else:
                    dist_kirsh = results.dist_roi[0] < self.threshold_medium.kirsh_aberration
                    dist_color = results.dist_roi[2] < self.threshold_medium.color_aberration
                    # If no aberration
                    if int(dist_kirsh)+int(dist_color) == 2:
                        response_for_client = self.green_width_medium(results)
                        response_for_client.set_status(ErrorRecognition.SUCCESS)
                    else:
                        response_for_client = self.orange_behaviour(results, self.width_medium)
                        response_for_client.set_status(ErrorRecognition.ABERRATION_VALUE)

        if response_for_client.flag == MTEResponse.GREEN:
            self.rollback = 0
        return response_for_client

    def behaviour_width_large(self, results):
        """Global behaviour for recognition of image (_,1730).
        Based on the activity diagram.
        Return a ResponseData.

        Keyword arguments:
        results -> the RecognitionData
        """

        if results.nb_kp < self.threshold_large.nb_kp:
            response_for_client = self.lost_width_large()
            response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_KEYPOINTS)
        # If not enough matches
        elif results.nb_match < self.threshold_large.nb_match:
            response_for_client = self.lost_width_large()
            response_for_client.set_status(ErrorRecognition.NOT_ENOUGHT_MATCH_CRITICAL)
        else:
            response = MTEResponse.GREEN
            # If not centered with target
            if not results.success:
                response_for_client = ResponseData([self.width_large,\
                    int(self.width_large*(1/self.format_resolution))], response,\
                    results.translations[0], results.translations[1], \
                    self.compute_direction(results.translations,\
                        results.scales, self.width_large), \
                    results.scales[0], results.scales[1],\
                    status=ErrorRecognition.SUCCESS)
            else:
                dist_kirsh = results.dist_roi[0] < self.threshold_large.mean_kirsh
                dist_canny = results.dist_roi[1] < self.threshold_large.mean_canny
                dist_color = results.dist_roi[2] < self.threshold_large.mean_color
                # If 0 or 1 mean valid
                if dist_kirsh+dist_canny+dist_color < 2:
                    response_for_client = self.lost_width_large()
                    response_for_client.set_status(ErrorRecognition.MEANS_OUT_OF_LIMITS)
                # If all means are valids
                elif dist_kirsh+dist_canny+dist_color == 3:
                    response_for_client = ResponseData([self.width_medium,\
                        int(self.width_medium*(1/self.format_resolution))], response,\
                        results.translations[0], results.translations[1], \
                        self.compute_direction(results.translations,\
                            results.scales, self.width_large), \
                        results.scales[0], results.scales[1],\
                        status=ErrorRecognition.SUCCESS)
                else:
                    dist_kirsh = results.dist_roi[0] < self.threshold_large.kirsh_aberration
                    dist_color = results.dist_roi[2] < self.threshold_large.color_aberration
                    # If no aberration
                    if dist_kirsh+dist_color == 2:
                        size = self.width_medium
                        status = ErrorRecognition.SUCCESS
                    else:
                        response = MTEResponse.ORANGE
                        size = self.width_large
                        status = ErrorRecognition.ABERRATION_VALUE
                    response_for_client = ResponseData([size,\
                        int(size*(1/self.format_resolution))], response,\
                        results.translations[0], results.translations[1], \
                        self.compute_direction(results.translations,\
                            results.scales, self.width_large), \
                        results.scales[0], results.scales[1], status=status)
        return response_for_client

    def fake_init_for_reference(self, image_ref):
        """Initialize learning datas with the reference and avoid the use of database.

        Keyword arguments:
        image_ref -> int array of the reference in full size
        """

        self.reference = LearningData()

        if self.mte_algo == MTEAlgo.VC_LIKE:
            self.vc_like_engine.learn(image_ref, self.reference)
            self.vc_like_engine.init_engine(self.reference)
        else:
            self.sift_engine.learn(image_ref, self.reference, \
                crop_image=True, crop_margin=self.crop_margin)
        self.ml_validator.learn(self.reference, image_ref)
        self.last_learning_data = self.reference

    def test_filter(self, blurred_image):
        """Test the recognition between the input and the image learned with fakeInitForReference.
        Return a RecognitionData

        Keyword arguments:
        blurred_image -> int array of the blurred reference
        """

        dim = (self.validation_width, self.validation_height)
        blurred_redux = cv2.resize(blurred_image, dim, interpolation=cv2.INTER_AREA)

        results = self.recognition(blurred_redux, testing_mode=True)
        if self.mte_algo == MTEAlgo.VC_LIKE:
            results = RecognitionData(*results[:-1])
        else:
            results = RecognitionData(*results)

        return results

    def crop_image(self, image, crop_margin):
        h, w = image.shape[:2]
        croped = image[int(h*crop_margin): int(h*(1-crop_margin)), \
            int(w*crop_margin): int(w*(1-crop_margin))]

        return croped

    def check_reference(self, image_ref):
        """Check if the image given is a valid reference.
        Return a dictinnary with 2 boolean:
        success -> is the given image valid as reference
        blurred -> is the given image blurred

        Keyword arguments:
        image_ref -> int array of the potential reference
        """

        size = int(image_ref.shape[1]/18)

        if not self.disable_blur:
            blurred = self.is_image_blurred(self.crop_image(image_ref, 1/3), \
                            size=size)
            if blurred[1]:
                print("The image is blurred")
                return ErrorLearning.ERROR_REFERENCE_IS_BLURRED

        kernel_size = 10
        sigma = 3
        kernel = 15
        # kernel_size = 2
        # sigma = 3
        # kernel = 1

        kernel_v = np.zeros((kernel_size, kernel_size))
        kernel_v[:, int((kernel_size - 1)/2)] = np.ones(kernel_size)
        kernel_v /= kernel_size

        kernel_h = np.zeros((kernel_size, kernel_size))
        kernel_h[int((kernel_size - 1)/2), :] = np.ones(kernel_size)
        kernel_h /= kernel_size

        self.fake_init_for_reference(image_ref)

        # Gaussian noise
        image_gaussian_blur = cv2.GaussianBlur(image_ref, (kernel, kernel), sigma)
        results = self.test_filter(image_gaussian_blur)
        # results = self.test_filter(image_ref)
        if not results.success:
            print("Failure gaussian blur")
            return ErrorLearning.GAUSSIAN_BLUR_FAILURE

        # Vertical motion blur.
        image_vertical_motion_blur = cv2.filter2D(image_ref, -1, kernel_v)
        results = self.test_filter(image_vertical_motion_blur)
        # results = self.test_filter(image_ref)

        if not results.success:
            print("Failure vertical blur")
            return ErrorLearning.VERTICAL_BLUR_FAILURE

        # Horizontal motion blur.
        image_horizontal_motion_blur = cv2.filter2D(image_ref, -1, kernel_h)
        results = self.test_filter(image_horizontal_motion_blur)
        # results = self.test_filter(image_ref)

        if not results.success:
            print("Failure horizontal blur")
            return ErrorLearning.HORIZONTAL_BLUR_FAILURE

        # All 3 noises are valid
        print("Valid for reference.")

        return ErrorLearning.SUCCESS

    def learning(self, full_image):
        """Test if the given image can be used as reference.
        Return a dictionary containing :
        success for global success
        blurred to indicate if the image is blurred
        learning_id for the position of the image in the DB

        Keyword arguments:
        full_image -> int array of the image
        """

        return self.check_reference(full_image)

    def recognition(self, image, testing_mode=False):
        """Compute the homography using the running engine.
        Computation is made between the image from the video stream and
        the image that have been learn with its id.

        Keyword arguments:
        pov_id -> int for the position of the reference in the DB
        image -> int array for the video stream
        """

        # Récupération d'une image, SIFT puis si validé VC léger avec mires auto
        ret_data = {
            "scale": "OK",
            "skew": "OK",
            "translation": {
                "x": "OK",
                "y": "OK"
            },
            "success": False
        }
        sum_distances = 9999
        distances = 9999

        fps = FPS().start()
        nb_matches = 0
        response_type = None
        if self.mte_algo == MTEAlgo.VC_LIKE:
            nb_kp = 300
            nb_matches = 150
            success, response_type, scales, skews, translation, transformed = self.vc_like_engine.\
                find_target(image, self.reference, testing_mode=testing_mode)
            
            # cv2.imshow("VC-like engine", transformed)
        else:
            success, scales, skews, translation, transformed, nb_matches, \
                nb_kp = self.sift_engine.recognition(image, self.reference, self.mte_algo)

        # Fix on portrait image
        if not self.landscape_image:
            h, w = image.shape[:2]
            translation = (translation[1], -1 * translation[0])
            scales = (scales[1], scales[0])
            skews = (skews[1], skews[0])

        scale_x, scale_y = scales
        skew_x, skew_y = skews
        scale = max(scale_x, scale_y)
        skew = max(skew_x, skew_y)

        # ML validation
        ml_success = False
        if success:
            ml_success, sum_distances, distances = self.ml_validator.\
                validate(self.reference, transformed)

        fps.update()
        fps.stop()

        if not ml_success:
            # Scale
            if scale < SIFTEngine.HOMOGRAPHY_MIN_SCALE:
                ret_data["scale"] = "far"
            elif scale > SIFTEngine.HOMOGRAPHY_MAX_SCALE:
                ret_data["scale"] = "close"

            if self.mte_algo == MTEAlgo.SIFT_KNN or self.mte_algo == MTEAlgo.SIFT_RANSAC:
                # Skew
                if -1*SIFTEngine.HOMOGRAPHY_MAX_SKEW > skew:
                    ret_data["skew"] = "minus"
                elif skew > SIFTEngine.HOMOGRAPHY_MAX_SKEW:
                    ret_data["skew"] = "plus"

                # Translation
                if translation[0] < SIFTEngine.HOMOGRAPHY_MIN_TRANS:
                    ret_data["translation"]["x"] = "minus"
                elif translation[0] > SIFTEngine.HOMOGRAPHY_MAX_TRANS:
                    ret_data["translation"]["x"] = "plus"

                if translation[1] < SIFTEngine.HOMOGRAPHY_MIN_TRANS:
                    ret_data["translation"]["y"] = "minus"
                elif translation[1] > SIFTEngine.HOMOGRAPHY_MAX_TRANS:
                    ret_data["translation"]["y"] = "plus"

        # cv2.imshow("Transformed", transformed)
        # cv2.waitKey(1)

        ret_data["success"] = success and ml_success

        if self.mte_algo == MTEAlgo.VC_LIKE:
            return success, ret_data, nb_kp, nb_matches, sum(translation),\
            sum(skews), sum_distances, distances, transformed, scales, translation, response_type
        else:
            return success, ret_data, nb_kp, nb_matches, sum(translation),\
            sum(skews), sum_distances, distances, transformed, scales, translation

def str2bool(string_value):
    """Convert a string to a bool."""

    if isinstance(string_value, bool):
        return string_value
    if string_value.lower() in ('yes', 'true', 't', 'y', '1', 'oui', 'o', 'vrai', 'v'):
        return True
    elif string_value.lower() in ('no', 'false', 'f', 'n', '0', 'non', 'faux'):
        return False
    else:
        raise argparse.ArgumentTypeError('Boolean value expected.')

if __name__ == "__main__":
    def convert_to_float(frac_str):
        """Convert a fraction written as string to a float"""

        try:
            return float(frac_str)
        except ValueError:
            num, denom = frac_str.split('/')
            try:
                leading, num = num.split(' ')
                whole = float(leading)
            except ValueError:
                whole = 0
            frac = float(num) / float(denom)
            return whole - frac if whole < 0 else whole + frac

    ap = argparse.ArgumentParser()
    ap.add_argument("-a", "--algo", required=False, default="VC_LIKE",\
        help="Feature detection algorithm (SIFT_KNN, SIFT_RANSAC or VC_LIKE). Default: VC_LIKE")
    ap.add_argument("-c", "--crop", required=False, default="1/6",\
        help="Part to crop around the center of the image (1/6, 1/4 or 0)? Used in SIFT engine. Default: 1/6")
    # ap.add_argument("-w", "--width", required=False, default=380, type=int,\
    #     help="Width of the input image (640, 380 or 320) for D2NET engine. Default: 380")
    ap.add_argument("-r", "--ransacount", required=False, default=300, type=int,\
        help="Number of randomize samples for Ransac evaluation. Default: 300")
    ap.add_argument("-b", "--disable_blur", required=False, type=str2bool, nargs='?',\
        const=True, default=False,\
        help="Disable the blur condition to capture. Default: False")
    ap.add_argument("-ct", "--disable_centering", required=False, type=str2bool, nargs='?',\
        const=True, default=False,\
        help="Disable the centering condition to capture. Default: False")
    ap.add_argument("-m", "--disable_histogram_matching", required=False, type=str2bool, nargs='?',\
        const=True, default=False,\
        help="Disable the histogram matching. Default: False")
    ap.add_argument("-o", "--oneshot", required=False, type=str2bool, nargs='?',\
        const=True, default=False,\
        help="Pass every step possible each time in VC-like mode. Use only with slow connection. Default: False")
    ap.add_argument("-d", "--debug", required=False, type=str2bool, nargs='?',\
        const=True, default=False,\
        help="Display debug images. Do not use with Docker. Default: False")
    args = vars(ap.parse_args())

    mte = MTE(mte_algo=MTEAlgo[args["algo"]], crop_margin=convert_to_float(args["crop"]),\
         ransacount=args["ransacount"], disable_blur=args["disable_blur"], disable_centering=args["disable_centering"], \
         one_shot_mode=args["oneshot"], disable_histogram_matching=args["disable_histogram_matching"], debug_mode=args["debug"])
    mte.listen_images()