# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
# SPDX-License-Identifier: Apache-2.0

###############################################################################
# PURPOSE:
#   Lambda function to check the status of a Rekognition job and save that job's
#   data to the MI dataplane when the job is complete.
###############################################################################

import os
import boto3
import json
from botocore import config
from aws_xray_sdk.core import xray_recorder
from aws_xray_sdk.core import patch_all
from MediaInsightsEngineLambdaHelper import OutputHelper
from MediaInsightsEngineLambdaHelper import MasExecutionError
from MediaInsightsEngineLambdaHelper import DataPlane

patch_all()

operator_name = os.environ['OPERATOR_NAME']
output_object = OutputHelper(operator_name)

mie_config = json.loads(os.environ['botoConfig'])
config = config.Config(**mie_config)
rek = boto3.client('rekognition', config=config)


def get_status(event, get_rek_status, metadata_error_key):
    """Handles requests to check rekognition status.

    Parameters:
        event (dict): The unmodified event from the lambda function handler.
        get_rek_status ((**kwargs) => dict): rekognition method to call for status.
        metadata_error_key (str): Key name used for errors reported via OutputHelper.add_workflow_metadata().

    Raises:
        MasExecutionError: Something went wrong.

    Returns:
        dict: Result of OutputHelper.return_output_object()
    """
    print("We got the following event:\n", event)

    error_message_format = "Missing key {e}"
    try:
        status = event["Status"]
        metadata = event['MetaData']
        asset_id = metadata['AssetId']

        # Images will have already been processed, so return if job status is already set.
        if status == "Complete":
            output_object.update_workflow_status("Complete")
            return output_object.return_output_object()

        error_message_format = "Missing a required metadata key {e}"
        job_id = metadata["JobId"]
        workflow_id = metadata["WorkflowExecutionId"]

    except KeyError as e:
        output_object.update_workflow_status("Error")
        output_object.add_workflow_metadata(**{metadata_error_key: error_message_format.format(e=e)})
        raise MasExecutionError(output_object.return_output_object())

    # Check rekognition job status:
    dataplane = DataPlane()
    # If pagination token is in metadata then use that to start
    # reading reko results from where this Lambda's previous invocation left off.
    pagination_token = metadata.get("PageToken", '')
    is_paginated = "PageToken" in metadata

    # Read and persist 10 reko pages per invocation of this Lambda
    for _ in range(11):
        # Get reko results
        print("job id: " + job_id + " page token: " + pagination_token)
        try:
            response = get_rek_status(JobId=job_id, NextToken=pagination_token)
        except rek.exceptions.InvalidPaginationTokenException as e:
            # Trying to reverse seek to the last valid pagination token would be difficult
            # to implement, so in the rare case that a pagination token expires we'll
            # just start over by reading from the first page.
            print(e)
            print("WARNING: Invalid pagination token found. Restarting read from first page.")
            pagination_token = ''
            continue

        # If the reko job is IN_PROGRESS then return. We'll check again after a step function wait.
        if response['JobStatus'] == "IN_PROGRESS":
            output_object.update_workflow_status("Executing")
            output_object.add_workflow_metadata(JobId=job_id, AssetId=asset_id, WorkflowExecutionId=workflow_id)
            return output_object.return_output_object()

        # If the reko job is FAILED then mark the workflow status as Error and return.
        elif response['JobStatus'] == "FAILED":
            output_object.update_workflow_status("Error")
            output_object.add_workflow_metadata(JobId=job_id, **{metadata_error_key: str(response["StatusMessage"])})
            raise MasExecutionError(output_object.return_output_object())

        # If reko job status is not SUCCEEDED, then mark workflow as failed
        elif response['JobStatus'] != "SUCCEEDED":
            output_object.update_workflow_status("Error")
            output_object.add_workflow_metadata(**{metadata_error_key: "Unable to determine status"})
            raise MasExecutionError(output_object.return_output_object())

        # The reko job is SUCCEEDED so save this current reko page result
        # and continue to next page_number.

        # If we were paging and there is no next token, we reached the end.
        have_next_token = 'NextToken' in response
        is_end = is_paginated and not have_next_token
        # If we were paging or need to start, is_paginated needs to reflect that.
        is_paginated = is_paginated or have_next_token

        # Persist rekognition results (current page)
        # If we've been saving pages, then tell dataplane this is the last page
        metadata_upload = dataplane.store_asset_metadata(asset_id=asset_id, operator_name=operator_name, workflow_id=workflow_id, results=response, paginate=is_paginated, end=is_end)

        # If dataplane request failed then mark workflow as failed
        if metadata_upload.get("Status", '') != "Success":
            output_object.update_workflow_status("Error")
            output_object.add_workflow_metadata(**{metadata_error_key: "Unable to upload metadata for {asset}: {error}".format(asset=asset_id, error=metadata_upload)}, JobId=job_id)
            raise MasExecutionError(output_object.return_output_object())

        # Log that this page has been successfully uploaded to the dataplane
        print("Uploaded metadata for asset: {asset}, job {JobId}, page {page}".format(asset=asset_id, JobId=job_id, page=pagination_token))

        # Get the next pagination token if it exists:
        pagination_token = response.get('NextToken', '')

        # If reko results didn't contain more pages, we're done; mark the stage as complete.
        if not have_next_token:
            output_object.add_workflow_metadata(JobId=job_id)
            output_object.update_workflow_status("Complete")
            return output_object.return_output_object()

    # In order to avoid Lambda timeouts, we're only going to persist 10 pages then
    # pass the pagination token to the workflow metadata and let our step function
    # invoker restart this Lambda. The pagination token allows this Lambda
    # continue from where it left off.
    output_object.update_workflow_status("Executing")
    output_object.add_workflow_metadata(PageToken=pagination_token, JobId=job_id, AssetId=asset_id, WorkflowExecutionId=workflow_id)
    return output_object.return_output_object()


###############################################################################
# AWS Lambda Handlers
###############################################################################

def check_content_moderation_status(event, _context):
    """Lambda function handler for checking content moderation status."""
    return get_status(event, rek.get_content_moderation, 'ContentModerationError')


def check_celebrity_recognition_status(event, _context):
    """Lambda function handler for checking celebrity recognition status."""
    return get_status(event, rek.get_celebrity_recognition, 'CelebrityRecognitionError')


def check_face_detection_status(event, _context):
    """Lambda function handler for checking face detection status."""
    return get_status(event, rek.get_face_detection, 'FaceDetectionError')


def check_face_search_status(event, _context):
    """Lambda function handler for checking face search status."""
    return get_status(event, rek.get_face_search, 'FaceSearchError')


def check_label_detection_status(event, _context):
    """Lambda function handler for checking label detection status."""
    return get_status(event, rek.get_label_detection, 'LabelDetectionError')


def check_person_tracking_status(event, _context):
    """Lambda function handler for checking person tracking status."""
    return get_status(event, rek.get_person_tracking, 'PersonTrackingError')


def check_shot_detection_status(event, _context):
    """Lambda function handler for checking shot detection status."""
    return get_status(event, rek.get_segment_detection, 'LabelDetectionError')


def check_technical_cue_status(event, _context):
    """Lambda function handler for checking technical cue status."""
    return get_status(event, rek.get_segment_detection, 'TechnicalCueDetectionError')


def check_text_detection_status(event, _context):
    """Lambda function handler for checking text detection status."""
    return get_status(event, rek.get_text_detection, 'TextDetectionError')