######################################################################
# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved. #
# SPDX-License-Identifier: MIT-0                                     #
######################################################################

import copy
import os
import json
import sys
import grpc
import argparse
import numpy as np
import pandas as pd
from tqdm import tqdm
import matplotlib.pyplot as plt
from lib.util.dict_util import dict_merge, flatten_dol, unflatten_dol
from sobol_sensitivity import SobolSensitivity
from chord import chordDiagram
sys.path.append("/app/grpc_compiled")

from grpc_compiled import model_interface_pb2, model_interface_pb2_grpc
from lib.util.encode_decode_json import utf_encode_json, utf_decode_json
from lib.grpc.retry_interceptor import RetryOnRpcErrorClientInterceptor, ExponentialBackoff

def _run_prediction(stub, model_dict):
    model_dict_enc = utf_encode_json(model_dict)
    query = model_interface_pb2.inRequest(inp_dict_bytes=model_dict_enc)
    response = stub.EvaluateModel(query)
    response_dict = utf_decode_json(response.response_bytes)

    return response_dict

def run_task(task_dict, hostname, port, **kwargs):

    # import debugpy; debugpy.listen(('0.0.0.0',5677)); debugpy.wait_for_client(); breakpoint()

    # Location has to flow in formally
    name_port = '%s:%s'%(hostname, port)

    # https://github.com/grpc/grpc/issues/19514
    interceptors = (
        RetryOnRpcErrorClientInterceptor(
            max_attempts=5,
            sleeping_policy=ExponentialBackoff(init_backoff_ms=1000, max_backoff_ms=30000, multiplier=2),
            status_for_retry=(grpc.StatusCode.UNAVAILABLE,),
        ),
    )
    stub = model_interface_pb2_grpc.ModelServiceStub(
        grpc.intercept_channel(grpc.insecure_channel(name_port), *interceptors)
    )
    # stub = model_interface_pb2_grpc.ModelServiceStub(channel)

    # channel = grpc.insecure_channel(name_port)
    # stub = model_interface_pb2_grpc.ModelServiceStub(channel)

    # Get the analyticSettings of the model
    task_analyticSettings = task_dict['analyticSettings']
    model_dict = task_analyticSettings['model']
    model_analyticSettings = model_dict['analyticSettings']
    tunableParams = model_analyticSettings['tunableParams']

    num_samples = task_analyticSettings['num_samples']
    num_splits = task_analyticSettings['num_splits']

    # Output the dictionary at the target location
    rel_dest_path = task_analyticSettings['rel_dest_path']
    file_list = []
    pm_root_path=os.getenv('PM_ROOT_PATH',default='wd')
    dest_path_full = '%s/%s'%(pm_root_path,rel_dest_path)
    os.makedirs(dest_path_full, exist_ok=True)

    # Pick the representative input that can be passed into the prediction request
    subselect_inputs = {}
    inputs_min_dict = {}
    inputs_max_dict = {}
    inputs_name_list = list(task_dict['inputs'].keys())
    for k, v in task_dict['inputs'].items():
        subselect_inputs[k] = [task_dict['inputs'][k][0]]
        inputs_min_dict[k] = np.min(task_dict['inputs'][k])
        inputs_max_dict[k] = np.max(task_dict['inputs'][k])

    # Save the map
    percent_range = task_analyticSettings['percent_range']
    _tunableParams_flat, _tunableParams_name_flat, _tunableParams_map = flatten_dol(tunableParams)
    _tunableParams_flat_min = [x * (1.0 - percent_range/100.) for x in _tunableParams_flat]
    _tunableParams_flat_max = [x * (1.0 + percent_range/100.) for x in _tunableParams_flat]
    n_tunableParams = len(_tunableParams_name_flat)
    _inputParams_flat, _inputParams_name_flat, _inputParams_map = flatten_dol(subselect_inputs)
    _inputParams_flat_min = [inputs_min_dict[x] for x in inputs_name_list]
    _inputParams_flat_max = [inputs_max_dict[x] for x in inputs_name_list]
    n_inputs = len(_inputParams_name_flat)

    # _inputParams = list(task_dict['inputs'].keys())
    # _inputParams_len = len(_inputParams)
    # _inputParams_flat = [task_dict['inputs'][k][0] for k in _inputParams]

    # overallParams_flat = []
    # overallParams_name_flat = []
    # if(task_analyticSettings['sensitivityParams']['model']):
    #     overallParams_flat.extend(_tunableParams_flat.copy())
    #     overallParams_name_flat.extend(_tunableParams_name_flat)
    # if(task_analyticSettings['sensitivityParams']['inputs']):
    #     overallParams_flat.extend(_inputParams_flat.copy())
    #     overallParams_name_flat.extend(_inputParams_name_flat)
    #
    # overall_flat_min = [x * (1.0 - percent_range/100.) for x in overallParams_flat]
    # overall_flat_max = [x * (1.0 + percent_range/100.) for x in overallParams_flat]

    overallParams_name_flat = []
    overallParams_name_flat.extend(_tunableParams_name_flat)
    overallParams_name_flat.extend(_inputParams_name_flat)
    overall_flat_min = []
    overall_flat_min.extend(_tunableParams_flat_min)
    overall_flat_min.extend(_inputParams_flat_min)
    overall_flat_max = []
    overall_flat_max.extend(_tunableParams_flat_max)
    overall_flat_max.extend(_inputParams_flat_max)

    # To prevent singular values of min and max being the same.. move the values by +epsilon and -epsilon
    epsilon = 0.001
    overall_flat_min = [x - epsilon for x in overall_flat_min]
    overall_flat_max = [x - epsilon for x in overall_flat_max]


    loc_ss = SobolSensitivity(np.vstack([np.array(overall_flat_min), np.array(overall_flat_max)]),
                              feat_list=overallParams_name_flat,
                              group_map=None)

    # Generate the Saltelli Samples
    num_samples_per_split = int(num_samples / num_splits)

    ret_dict = []
    overall_out_array_list = []
    for idx_delta_sample in range(num_splits):
        print('Generating Sample Split Group: %d / %d'%(idx_delta_sample, num_splits))
        calc_idx_ss = idx_delta_sample * num_samples_per_split

        out_array = loc_ss.generate_samples_partial(n_samples=num_samples,
                                                    n_partial=num_samples_per_split,
                                                    idx_partial=calc_idx_ss)

        overall_out_array_list.append(out_array)

    overall_out_array = np.vstack(overall_out_array_list)

    # Dump the samples to a file for the user
    temp_overall_pd = pd.DataFrame(data=overall_out_array, columns=overallParams_name_flat)
    out_samples_file_path = '%s/salitelli_samples.csv'%(dest_path_full)
    temp_overall_pd.to_csv(out_samples_file_path)
    file_list.append(out_samples_file_path)

    (nrows, ncols) = overall_out_array.shape
    print('Saltelli Sampling Size: (%d, %d)'%(nrows, ncols))
    # Convert each row into a tunable_params dict along with idx
    # the idx will be ignored if it is a scalar
    response_dict_list = []
    for cur_idx in tqdm(range(nrows)):
        model_dict_clone = copy.deepcopy(model_dict)

        # cur_idx = idx_delta_sample * nrows + cur_delta_idx

        candidate_sample_list = list(overall_out_array[cur_idx, :])

        tunableParam_dict = {
            # "idx_passthrough": cur_idx
        }
        for k, v in _tunableParams_map.items():
            tunableParam_dict[k] = list([candidate_sample_list[i] for i in v])

        model_dict_clone['analyticSettings']['tunableParams'] = tunableParam_dict

        # If inputs are part of the analysis, otherwise leave it at default
        # if (task_analyticSettings['sensitivityParams']['inputs']):
        # Compose the inputs dictionary
        inputs_dict = {}
        # the value array index is relative to the inputs.. so offset it by n_tunableParams
        for k, v in _inputParams_map.items():
            inputs_dict[k] = list([candidate_sample_list[n_tunableParams + i] for i in v])
        model_dict_clone['inputs'] = inputs_dict
        # else:
        #     model_dict_clone['inputs'] = subselect_inputs

        # Run the model for the current sample
        _loc_response_dict = _run_prediction(stub, model_dict=model_dict_clone)
        response_dict_list.append(_loc_response_dict)

    print('Evaluation of Samples completed')

    out_samples_eval_file_path = '%s/salitelli_eval.csv'%(dest_path_full)
    with open(out_samples_eval_file_path, 'w') as fp:
        json.dump(response_dict_list, fp)
    file_list.append(out_samples_eval_file_path)

    # Extract the outputs and run the sensitivity calculation using the same sobol problem
    # Assemble the outputs into a list of dictionaries so that we can convert into a PD
    consolidated_output_lod = []
    for cur_item in response_dict_list:
        # Flatten the lists by the variables
        add_item = {}
        for k, v in cur_item['prediction'].items():
            if isinstance(v, list):
                add_item[k] = v[0] # Sobol eval is done for one sample at a time
            else:
                add_item[k] = v
        consolidated_output_lod.append(add_item)

    output_pd = pd.DataFrame.from_dict(consolidated_output_lod)
    # Sort the output_pd by the idx_passThrough (and dump the
    # output_pd_sorted = output_pd.sort_values(by='idx_passthrough').set_index('idx_passthrough')

    # Output Keys
    output_keys_list = output_pd.columns # output_pd_sorted.columns
    ret_dict = {}
    for k in output_keys_list:
        ret_dict[k] = loc_ss.analyze_problem(output_pd[k].values)

    result_json_filepath_full = '%s/sensitivity_results.json'%(dest_path_full)
    with open(result_json_filepath_full, 'w') as fp:
        json.dump(ret_dict, fp)
        print('Exported: %s'%(result_json_filepath_full))
    file_list.append(result_json_filepath_full)

    # Generate the bar and chord plots
    for k, v in ret_dict.items():
        # Generate the plot for the First order sensitivities
        width = 0.3
        fig, ax = plt.subplots(1, 1, sharex=True)
        n_vars = len(overallParams_name_flat)
        ax.bar(np.arange(n_vars)-width/2, v['first_order'], width, label='first_order')
        ax.bar(np.arange(n_vars)+width/2, v['total_effect'], width, label='total_effect')
        ax.set_title('Sensitivity: %s'%(k))
        ax.set_xticks(np.arange(n_vars), labels=overallParams_name_flat)
        ax.legend()
        ax.grid()
        plt.xticks(rotation=90)
        plt.tight_layout()
        fig.savefig('%s/%s_total_first_order.png' % (dest_path_full, k))
        plt.close(fig)

        # Generate the Chord Diagram
        fig = plt.figure(figsize=(8, 8))
        flux = np.array(v['second_order'])
        ax = plt.axes([0,0,1,1])
        nodePos = chordDiagram(flux, ax)
        ax.axis('off')
        prop = dict(fontsize=16*0.8, ha='center', va='center')
        nodes = overallParams_name_flat
        for i in range(n_vars):
            ax.text(nodePos[i][0], nodePos[i][1], nodes[i], rotation=nodePos[i][2]+90, **prop)

        plt.savefig("%s/%s_interaction.png"%(dest_path_full, k), dpi=100,
                bbox_inches='tight', pad_inches=0.1)
        plt.close(fig)

    meta_data_filepath_full = '%s/metadata.json'%(dest_path_full)
    add_metadata = {
        'description': 'Sensitivity Analysis',
        'filename':'metadata.json'
    }
    meta_data_dict = {
        'metadata': {**ret_dict, **add_metadata},
        'file_list': file_list
    }
    with open(meta_data_filepath_full, 'w') as fp:
        json.dump(meta_data_dict, fp)
        print('Exported: %s' % (meta_data_filepath_full))

if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument('--config', help='Relative path to the json file describing this model build task')
    args = parser.parse_args()

    task_json_path_full = '%s' % (args.config)
    with open(task_json_path_full, 'r') as fp:
        task_dict = json.load(fp)

    # Extract the data and model locations
    # Update it back in the task dict
    # TODO: A cleaner segregation is needed here
    rel_data_path = task_dict['analyticSettings']['rel_data_path']
    # rel_model_path = task_dict['analyticSettings']['rel_model_path']
    rel_service_path = task_dict['analyticSettings']['rel_service_path']
    pm_root_path=os.getenv('PM_ROT_PATH',default='wd')
    data_metadata_json = '%s/%s/metadata.json'%(pm_root_path,rel_data_path)
    with open(data_metadata_json, 'r') as fp:
        data_metadata_dict = json.load(fp)

    data_filename = data_metadata_dict['metadata']['filename']
    with open('%s/%s/%s'%(pm_root_path,rel_data_path, data_filename), 'r') as fp:
        data_dict = json.load(fp)

    #
    # with open('%s/data.json'%(rel_data_path), 'r') as fp:
    #     data_dict = json.load(fp)
    # with open('%s/model.json'%(rel_model_path), 'r') as fp:
    #     model_dict = json.load(fp)
    with open('%s/%s/metadata.json'%(pm_root_path,rel_service_path), 'r') as fp:
        service_dict = json.load(fp)

    dict_merge(task_dict, data_dict)
    # Get the model dict from the service metadata instead of a model node
    # task_dict['analyticSettings']['model'] = model_dict
    task_dict['analyticSettings']['model'] = service_dict['metadata']['model']

    run_task(task_dict,service_dict['metadata']['name'], service_dict['metadata']['port_internal'])