#!/usr/bin/env python3

supported_extensions = ['jpeg', 'jpg', 'gif', 'png']

import errno
import os
import json

import numpy as np
import cv2


# Load and preprocess image
def load_image(image_path,                # Full path to processing image
               target_size,               # Desired size of resulting image
               data_type = 'uint8',       # Data type to store
               convert_to_bgr = False,    # Swap image channel RGB -> BGR
               normalize_data = False,    # Normalize the data   = os.getenv('_NORMALIZE_DATA') in ('YES', 'yes', 'ON', 'on', '1')
               normalize_lower = -1,      # Normalize - lower limit
               normalize_upper = 1,       # Normalize - upper limit
               subtract_mean = False,     # Subtract mean
               given_channel_means = '',  # Given channel means
               quantize = 0,              # Quantization type, 1 for quantize to int8 
               quant_scale = 1,           # Quantization scale 
               quant_offset = 0,          # Quantization offset 
               convert_to_unsigned  = 0   # 1 to convert from int to uint
              ):

    image = cv2.imread(image_path)

    if len(image.shape) < 3 or image.shape[2] != 3:
        image = cv2.cvtColor(image, cv2.COLOR_GRAY2RGB)
    else:
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

    original_height, original_width, _ = image.shape

#    image_id = ck_utils.filename_to_id(image_file, DATASET_TYPE)
#    processed_image_ids.append(image_id)

    # The array based representation of the image will be used later
    # in order to prepare the result image with boxes and labels on it.

    image = cv2.resize(image, (target_size, target_size), interpolation=cv2.INTER_LINEAR)

    # Convert to NumPy array
    img = np.asarray(image, np.float32)

    if convert_to_bgr:
        img = img[...,::-1]     # swapping Red and Blue colour channels

    img = img.astype(np.float32)

    # Normalize
    if normalize_data:
        img = img*((normalize_upper-normalize_lower)/255.0)+normalize_lower

    # Subtract mean value
    if subtract_mean:
        if len(given_channel_means):
            img -= given_channel_means
        else:
            img -= np.mean(img, axis=(0,1), keepdims=True)

    if len(given_channel_stds):
        img /= given_channel_stds

    if data_layout == 'NCHW':
        img = img.transpose(2,0,1)
    elif data_layout == 'CHW4':
        img = np.pad(img, ((0,0), (0,0), (0,1)), 'constant')

    # Value 1 for quantization to int8
    if quantize == 1:
        img = quantize_to_int8(img, quant_scale, quant_offset)

    # Value 1 to convert from int8 to uint8
    if convert_to_unsigned == 1:
        img = int8_to_uint8(img)


    # Make batch from single image
    batch_shape = (1, target_size, target_size, 3)
    batch_data = img.reshape(batch_shape)

    return batch_data, original_width, original_height

def quantize_to_int8(image, scale, offset):
    quant_image = (image/scale + offset).astype(np.float32)
    output = np.copy(quant_image)
    gtZero = (quant_image > 0).astype(int)
    gtZero = gtZero * 0.5
    output=output+gtZero
    ltZero = (quant_image < 0).astype(int)
    ltZero = ltZero * (-0.5)
    output=output+ltZero
    return output.astype(np.int8)


def int8_to_uint8(image):
    image = (image+128).astype(np.uint8)
    return image


def preprocess_files(selected_filenames,
                     source_dir,
                     destination_dir,
                     square_side,
                     data_type,
                     convert_to_bgr,
                     normalize_data,
                     normalize_lower,
                     normalize_upper,
                     subtract_mean,
                     given_channel_means,
                     quantize,
                     quant_scale, 
                     quant_offset, 
                     convert_to_unsigned,
                     new_file_extension):

    "Go through the selected_filenames and preprocess all the files"

    output_signatures = []

    for current_idx in range(len(selected_filenames)):
        input_filename = selected_filenames[current_idx]

        full_input_path     = os.path.join(source_dir, input_filename)

        image_data, original_width, original_height = load_image(image_path = full_input_path,
                                                                 target_size = square_side,
                                                                 data_type = data_type,
                                                                 convert_to_bgr = convert_to_bgr,
                                                                 normalize_data = normalize_data,
                                                                 normalize_lower = normalize_lower,
                                                                 normalize_upper = normalize_upper,
                                                                 subtract_mean = subtract_mean,
                                                                 given_channel_means = given_channel_means,
                                                                 quantize = quantize,
                                                                 quant_scale = quant_scale, 
                                                                 quant_offset = quant_offset, 
                                                                 convert_to_unsigned = convert_to_unsigned)

        output_filename = input_filename.rsplit('.', 1)[0] + '.' + new_file_extension if new_file_extension else input_filename

        full_output_path    = os.path.join(destination_dir, output_filename)
        image_data.tofile(full_output_path)

        print("[{}]:  Stored {}".format(current_idx+1, full_output_path) )

        output_signatures.append('{};{};{}'.format(output_filename, original_width, original_height) )

    return output_signatures


## Internal processing:
#
INTERMEDIATE_DATA_TYPE  = np.float32    # default for internal conversion
#INTERMEDIATE_DATA_TYPE  = np.int8       # affects the accuracy a bit

if __name__ == '__main__':
    import sys

    source_dir              = sys.argv[1]   # ignored if CK_IMAGE_FILE points to a file
    destination_dir         = sys.argv[2]

    square_side             = int( os.environ['_INPUT_SQUARE_SIDE'] )
    offset                  = int( os.getenv('_SUBSET_OFFSET', 0) )
    volume_str              = os.getenv('_SUBSET_VOLUME', '' )
    fof_name                = os.getenv('_SUBSET_FOF', 'fof.txt')
    data_type               = os.getenv('_DATA_TYPE', 'uint8')
    new_file_extension      = os.getenv('_NEW_EXTENSION', '')
    image_file              = os.getenv('CK_IMAGE_FILE', '')

    data_layout             = os.getenv('_DATA_LAYOUT', 'NHWC')
    convert_to_bgr          = os.getenv('_COLOUR_CHANNELS_BGR', 'NO') in ('YES', 'yes', 'ON', 'on', '1')
    input_data_type         = os.getenv('_INPUT_DATA_TYPE', 'float32')

    ## Image normalization:
    #
    normalize_data    = os.getenv('_NORMALIZE_DATA') in ('YES', 'yes', 'ON', 'on', '1')
    normalize_lower   = float(os.getenv('_NORMALIZE_LOWER', -1.0))
    normalize_upper   = float(os.getenv('_NORMALIZE_UPPER',  1.0))
    subtract_mean           = os.getenv('_SUBTRACT_MEAN', 'NO') in ('YES', 'yes', 'ON', 'on', '1')
    given_channel_means     = os.getenv('_GIVEN_CHANNEL_MEANS', '')
    quant_scale             = float( os.environ['_QUANT_SCALE'] )
    quant_offset            = float( os.environ['_QUANT_OFFSET'] )
    quantize                = int( os.environ['_QUANTIZE'] ) #1 for quantize to int8
    convert_to_unsigned     = int( os.environ['_CONVERT_TO_UNSIGNED'] ) #1 for int8 to uint8

    if given_channel_means:
        given_channel_means = np.fromstring(given_channel_means, dtype=np.float32, sep=' ').astype(INTERMEDIATE_DATA_TYPE)
        if convert_to_bgr:
            given_channel_means = given_channel_means[::-1]     # swapping Red and Blue colour channels

    given_channel_stds      = os.getenv('_GIVEN_CHANNEL_STDS', '')
    if given_channel_stds:
        given_channel_stds = np.fromstring(given_channel_stds, dtype=np.float32, sep=' ').astype(INTERMEDIATE_DATA_TYPE)
        if convert_to_bgr:
            given_channel_stds  = given_channel_stds[::-1]      # swapping Red and Blue colour channels


    print("From: {} , To: {} , Size: {} ,  OFF: {}, VOL: '{}', FOF: {}, DTYPE: {}, EXT: {}, IMG: {}".format(
        source_dir, destination_dir, square_side, offset, volume_str, fof_name, data_type, new_file_extension, image_file) )

    if image_file:
        source_dir          = os.path.dirname(image_file)
        selected_filenames  = [ os.path.basename(image_file) ]

    else:
        annotations_filepath = os.getenv('CK_ENV_DATASET_ANNOTATIONS')
        calibration = os.path.exists( os.path.join( os.getenv('CK_ENV_DATASET_IMAGE_DIR'), 'coco_cal_images_list.txt' ) )

        if annotations_filepath and not calibration:  # get the "coco-natural" filename order (not necessarily alphabetic)
            with open(annotations_filepath, "r") as annotations_fh:
                annotations_struct = json.load(annotations_fh)

            ordered_filenames = [ image_entry['file_name'] for image_entry in annotations_struct['images'] ]

        elif os.path.isdir(source_dir):     # in the absence of "coco-natural", use alphabetic order

            ordered_filenames = [filename for filename in sorted(os.listdir(source_dir)) if any(filename.lower().endswith(extension) for extension in supported_extensions) ]

        else:
            raise FileNotFoundError(errno.ENOENT, os.strerror(errno.ENOENT), source_dir)

        total_volume = len(ordered_filenames)

        if offset<0:        # support offsets "from the right"
            offset += total_volume

        volume = int(volume_str) if len(volume_str)>0 else total_volume-offset

        selected_filenames = ordered_filenames[offset:offset+volume]


    output_signatures = preprocess_files(selected_filenames,
                                         source_dir,
                                         destination_dir,
                                         square_side,
                                         data_type,
                                         convert_to_bgr,
                                         normalize_data,
                                         normalize_lower,
                                         normalize_upper,
                                         subtract_mean,
                                         given_channel_means,
                                         quantize,
                                         quant_scale, 
                                         quant_offset, 
                                         convert_to_unsigned,
                                         new_file_extension)

    fof_full_path = os.path.join(destination_dir, fof_name)
    with open(fof_full_path, 'w') as fof:
        for filename in output_signatures:
            fof.write(filename + '\n')