# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"). You
# may not use this file except in compliance with the License. A copy of
# the License is located at
#
#     http://aws.amazon.com/apache2.0/
#
# or in the "license" file accompanying this file. This file is
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
# ANY KIND, either express or implied. See the License for the specific
# language governing permissions and limitations under the License.
from __future__ import absolute_import

import datetime
import unittest
import cloudpickle
from math import inf, nan
from unittest.mock import patch, Mock, MagicMock

import dateutil
import pytest

from sagemaker.experiments import _environment, SortOrderType
from sagemaker.experiments._api_types import (
    TrialComponentArtifact,
    TrialComponentSummary,
    TrialComponentStatus,
    _TrialComponentStatusType,
    TrialComponentSearchResult,
)
from sagemaker.experiments.experiment import Experiment
from sagemaker.experiments.run import (
    TRIAL_NAME_TEMPLATE,
    MAX_RUN_TC_ARTIFACTS_LEN,
    MAX_NAME_LEN_IN_BACKEND,
    EXPERIMENT_NAME,
    RUN_NAME,
    TRIAL_NAME,
    DELIMITER,
    RUN_TC_TAG,
    SortByType,
)
from sagemaker.experiments import Run, load_run, list_runs
from sagemaker.experiments.trial import _Trial
from sagemaker.experiments.trial_component import _TrialComponent
from sagemaker.experiments._helper import _DEFAULT_ARTIFACT_PREFIX
from tests.unit.sagemaker.experiments.helpers import (
    mock_trial_load_or_create_func,
    mock_tc_load_or_create_func,
    TEST_EXP_NAME,
    TEST_EXP_NAME_MIXED_CASE,
    TEST_RUN_NAME,
    TEST_EXP_DISPLAY_NAME,
    TEST_RUN_DISPLAY_NAME,
    TEST_ARTIFACT_BUCKET,
    TEST_ARTIFACT_PREFIX,
)


@pytest.mark.parametrize(
    ("kwargs", "expected_artifact_bucket", "expected_artifact_prefix"),
    [
        ({}, None, _DEFAULT_ARTIFACT_PREFIX),
        (
            {
                "artifact_bucket": TEST_ARTIFACT_BUCKET,
                "artifact_prefix": TEST_ARTIFACT_PREFIX,
            },
            TEST_ARTIFACT_BUCKET,
            TEST_ARTIFACT_PREFIX,
        ),
    ],
)
@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
@patch.object(_TrialComponent, "save")
def test_run_init(
    mock_tc_save,
    sagemaker_session,
    kwargs,
    expected_artifact_bucket,
    expected_artifact_prefix,
):
    sagemaker_session.sagemaker_client.search.return_value = {"Results": []}
    with Run(
        experiment_name=TEST_EXP_NAME,
        run_name=TEST_RUN_NAME,
        sagemaker_session=sagemaker_session,
        **kwargs,
    ) as run_obj:
        assert not run_obj._in_load
        assert not run_obj._inside_load_context
        assert run_obj._inside_init_context
        assert not run_obj._trial_component.parameters

        expected_tc_name = f"{TEST_EXP_NAME}{DELIMITER}{TEST_RUN_NAME}"
        assert run_obj.experiment_name == TEST_EXP_NAME
        assert run_obj.run_name == TEST_RUN_NAME
        assert run_obj.run_group_name == TRIAL_NAME_TEMPLATE.format(TEST_EXP_NAME)
        assert run_obj._trial_component.trial_component_name == expected_tc_name
        assert run_obj._trial.trial_name == TRIAL_NAME_TEMPLATE.format(TEST_EXP_NAME)
        assert run_obj._experiment.experiment_name == TEST_EXP_NAME
        assert run_obj.experiment_config == {
            EXPERIMENT_NAME: TEST_EXP_NAME,
            TRIAL_NAME: run_obj.run_group_name,
            RUN_NAME: expected_tc_name,
        }
        assert run_obj._artifact_uploader.artifact_bucket == expected_artifact_bucket
        assert run_obj._artifact_uploader.artifact_prefix == expected_artifact_prefix

    # trail_component.save is called when entering/ exiting the with block
    mock_tc_save.assert_called()
    run_obj._trial.add_trial_component.assert_called()


def test_run_init_name_length_exceed_limit(sagemaker_session):
    invalid_name = "x" * MAX_NAME_LEN_IN_BACKEND

    # experiment_name exceeds
    with pytest.raises(ValueError) as err:
        Run(
            experiment_name=invalid_name,
            run_name=TEST_RUN_NAME,
            sagemaker_session=sagemaker_session,
        )

    assert (
        f"The experiment_name (length: {MAX_NAME_LEN_IN_BACKEND}) must have length less than"
        in str(err)
    )

    # run_name exceeds
    with pytest.raises(ValueError) as err:
        Run(
            experiment_name=TEST_EXP_NAME,
            run_name=invalid_name,
            sagemaker_session=sagemaker_session,
        )

    assert f"The run_name (length: {MAX_NAME_LEN_IN_BACKEND}) must have length less than" in str(
        err
    )


@pytest.mark.parametrize(
    ("kwargs", "expected_artifact_bucket", "expected_artifact_prefix"),
    [
        ({}, None, _DEFAULT_ARTIFACT_PREFIX),
        (
            {
                "artifact_bucket": TEST_ARTIFACT_BUCKET,
                "artifact_prefix": TEST_ARTIFACT_PREFIX,
            },
            TEST_ARTIFACT_BUCKET,
            TEST_ARTIFACT_PREFIX,
        ),
    ],
)
@patch.object(_TrialComponent, "save", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
@patch("sagemaker.experiments.run._RunEnvironment")
def test_run_load_no_run_name_and_in_train_job(
    mock_run_env,
    sagemaker_session,
    kwargs,
    expected_artifact_bucket,
    expected_artifact_prefix,
):
    client = sagemaker_session.sagemaker_client
    job_name = "my-train-job"
    rv = Mock()
    rv.source_arn = f"arn:1234/{job_name}"
    rv.environment_type = _environment._EnvironmentType.SageMakerTrainingJob
    mock_run_env.load.return_value = rv

    expected_tc_name = f"{TEST_EXP_NAME}{DELIMITER}{TEST_RUN_NAME}"
    exp_config = {
        EXPERIMENT_NAME: TEST_EXP_NAME,
        TRIAL_NAME: Run._generate_trial_name(TEST_EXP_NAME),
        RUN_NAME: expected_tc_name,
    }
    client.describe_training_job.return_value = {
        "TrainingJobName": "train-job-experiments",
        # The Run object has been created else where
        "ExperimentConfig": exp_config,
    }
    sagemaker_session.sagemaker_client.search.return_value = {
        "Results": [
            {
                "TrialComponent": {
                    "Parents": [
                        {"ExperimentName": TEST_EXP_NAME, "TrialName": exp_config[TRIAL_NAME]}
                    ],
                    "TrialComponentName": expected_tc_name,
                }
            }
        ]
    }
    with load_run(sagemaker_session=sagemaker_session, **kwargs) as run_obj:
        assert run_obj._in_load
        assert not run_obj._inside_init_context
        assert run_obj._inside_load_context
        assert run_obj.run_name == TEST_RUN_NAME
        assert run_obj._trial_component.trial_component_name == expected_tc_name
        assert run_obj.run_group_name == Run._generate_trial_name(TEST_EXP_NAME)
        assert run_obj._trial
        assert run_obj.experiment_name == TEST_EXP_NAME
        assert run_obj._experiment
        assert run_obj.experiment_config == exp_config
        assert run_obj._artifact_uploader.artifact_bucket == expected_artifact_bucket
        assert run_obj._artifact_uploader.artifact_prefix == expected_artifact_prefix

    client.describe_training_job.assert_called_once_with(TrainingJobName=job_name)
    run_obj._trial.add_trial_component.assert_not_called()


@patch("sagemaker.experiments.run._RunEnvironment")
def test_run_load_no_run_name_and_in_train_job_but_fail_to_get_exp_cfg(
    mock_run_env, sagemaker_session
):
    rv = Mock()
    rv.source_arn = "arn:1234/my-train-job"
    rv.environment_type = _environment._EnvironmentType.SageMakerTrainingJob
    mock_run_env.load.return_value = rv

    # No Run object is created else where
    sagemaker_session.sagemaker_client.describe_training_job.return_value = {
        "TrainingJobName": "train-job-experiments",
    }

    with pytest.raises(RuntimeError) as err:
        with load_run(sagemaker_session=sagemaker_session):
            pass

    assert "Not able to fetch RunName in ExperimentConfig of the sagemaker job" in str(err)


def test_run_load_no_run_name_and_not_in_train_job(run_obj, sagemaker_session):
    with run_obj:
        with load_run(sagemaker_session=sagemaker_session) as run:
            assert run_obj == run


def test_run_load_no_run_name_and_not_in_train_job_but_no_obj_in_context(sagemaker_session):
    with pytest.raises(RuntimeError) as err:
        with load_run(sagemaker_session=sagemaker_session):
            pass

    assert "Failed to load a Run object" in str(err)

    # experiment_name is given but is not supplied along with the run_name so it's ignored.
    with pytest.raises(RuntimeError) as err:
        with load_run(experiment_name=TEST_EXP_NAME, sagemaker_session=sagemaker_session):
            pass

    assert "Failed to load a Run object" in str(err)


@pytest.mark.parametrize(
    ("kwargs", "expected_artifact_bucket", "expected_artifact_prefix"),
    [
        ({}, None, _DEFAULT_ARTIFACT_PREFIX),
        (
            {
                "artifact_bucket": TEST_ARTIFACT_BUCKET,
                "artifact_prefix": TEST_ARTIFACT_PREFIX,
            },
            TEST_ARTIFACT_BUCKET,
            TEST_ARTIFACT_PREFIX,
        ),
    ],
)
@patch.object(_TrialComponent, "save", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
def test_run_load_with_run_name_and_exp_name(
    sagemaker_session, kwargs, expected_artifact_bucket, expected_artifact_prefix
):
    sagemaker_session.sagemaker_client.search.return_value = {"Results": []}
    with load_run(
        run_name=TEST_RUN_NAME,
        experiment_name=TEST_EXP_NAME,
        sagemaker_session=sagemaker_session,
        **kwargs,
    ) as run_obj:
        expected_tc_name = f"{TEST_EXP_NAME}{DELIMITER}{TEST_RUN_NAME}"
        expected_exp_config = {
            EXPERIMENT_NAME: TEST_EXP_NAME,
            TRIAL_NAME: Run._generate_trial_name(TEST_EXP_NAME),
            RUN_NAME: expected_tc_name,
        }

        assert run_obj.run_name == TEST_RUN_NAME
        assert run_obj.run_group_name == Run._generate_trial_name(TEST_EXP_NAME)
        assert run_obj.experiment_name == TEST_EXP_NAME
        assert run_obj._trial_component.trial_component_name == expected_tc_name
        assert run_obj._trial
        assert run_obj._experiment
        assert run_obj.experiment_config == expected_exp_config
        assert run_obj._artifact_uploader.artifact_bucket == expected_artifact_bucket
        assert run_obj._artifact_uploader.artifact_prefix == expected_artifact_prefix

    run_obj._trial.add_trial_component.assert_called()


def test_run_load_with_run_name_but_no_exp_name(sagemaker_session):
    with pytest.raises(ValueError) as err:
        with load_run(
            run_name=TEST_RUN_NAME,
            sagemaker_session=sagemaker_session,
        ):
            pass

    assert "Invalid input: experiment_name is missing" in str(err)


@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
@patch.object(_TrialComponent, "save", MagicMock(return_value=None))
@patch("sagemaker.experiments.run._RunEnvironment")
def test_run_load_in_sm_processing_job(mock_run_env, sagemaker_session):
    client = sagemaker_session.sagemaker_client
    job_name = "my-process-job"
    rv = unittest.mock.Mock()
    rv.source_arn = f"arn:1234/{job_name}"
    rv.environment_type = _environment._EnvironmentType.SageMakerProcessingJob
    mock_run_env.load.return_value = rv

    expected_tc_name = f"{TEST_EXP_NAME}{DELIMITER}{TEST_RUN_NAME}"
    exp_config = {
        EXPERIMENT_NAME: TEST_EXP_NAME,
        TRIAL_NAME: Run._generate_trial_name(TEST_EXP_NAME),
        RUN_NAME: expected_tc_name,
    }
    client.describe_processing_job.return_value = {
        "ProcessingJobName": "process-job-experiments",
        # The Run object has been created else where
        "ExperimentConfig": exp_config,
    }
    sagemaker_session.sagemaker_client.search.return_value = {
        "Results": [
            {
                "TrialComponent": {
                    "Parents": [
                        {"ExperimentName": TEST_EXP_NAME, "TrialName": exp_config[TRIAL_NAME]}
                    ],
                    "TrialComponentName": expected_tc_name,
                }
            }
        ]
    }

    with load_run(sagemaker_session=sagemaker_session):
        pass

    client.describe_processing_job.assert_called_once_with(ProcessingJobName=job_name)
    mock_run_env._trial.add_trial_component.assert_not_called()


@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
@patch.object(_TrialComponent, "save", MagicMock(return_value=None))
@patch("sagemaker.experiments.run._RunEnvironment")
def test_run_load_in_sm_transform_job(mock_run_env, sagemaker_session):
    client = sagemaker_session.sagemaker_client
    job_name = "my-transform-job"
    rv = unittest.mock.Mock()
    rv.source_arn = f"arn:1234/{job_name}"
    rv.environment_type = _environment._EnvironmentType.SageMakerTransformJob
    mock_run_env.load.return_value = rv

    expected_tc_name = f"{TEST_EXP_NAME}{DELIMITER}{TEST_RUN_NAME}"
    exp_config = {
        EXPERIMENT_NAME: TEST_EXP_NAME,
        TRIAL_NAME: Run._generate_trial_name(TEST_EXP_NAME),
        RUN_NAME: expected_tc_name,
    }
    client.describe_transform_job.return_value = {
        "TransformJobName": "transform-job-experiments",
        # The Run object has been created else where
        "ExperimentConfig": exp_config,
    }
    sagemaker_session.sagemaker_client.search.return_value = {
        "Results": [
            {
                "TrialComponent": {
                    "Parents": [
                        {"ExperimentName": TEST_EXP_NAME, "TrialName": exp_config[TRIAL_NAME]}
                    ],
                    "TrialComponentName": expected_tc_name,
                }
            }
        ]
    }

    with load_run(sagemaker_session=sagemaker_session):
        pass

    client.describe_transform_job.assert_called_once_with(TransformJobName=job_name)
    mock_run_env._trial.add_trial_component.assert_not_called()


@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch(
    "sagemaker.experiments.run._TrialComponent._load_or_create",
    MagicMock(side_effect=mock_tc_load_or_create_func),
)
@patch.object(_TrialComponent, "save")
def test_run_object_serialize_deserialize(mock_tc_save, sagemaker_session):
    sagemaker_session.sagemaker_client.search.return_value = {"Results": []}
    run_obj = Run(
        experiment_name=TEST_EXP_NAME,
        run_name=TEST_RUN_NAME,
        experiment_display_name=TEST_EXP_DISPLAY_NAME,
        run_display_name=TEST_RUN_DISPLAY_NAME,
        sagemaker_session=sagemaker_session,
    )
    with pytest.raises(
        NotImplementedError, match="Instance of Run type is not allowed to be pickled."
    ):
        cloudpickle.dumps(run_obj)


def test_log_parameter_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_parameter("foo", "bar")
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_parameter(run_obj):
    with run_obj:
        run_obj.log_parameter("foo", "bar")
        assert run_obj._trial_component.parameters["foo"] == "bar"
        run_obj.log_parameter("whizz", 1)
        assert run_obj._trial_component.parameters["whizz"] == 1


def test_log_parameter_skip_invalid_value(run_obj):
    with run_obj:
        run_obj.log_parameter("key", nan)
        assert "key" not in run_obj._trial_component.parameters


def test_log_parameters_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_parameters({"a": "b", "c": "d", "e": 5})
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_parameters(run_obj):
    with run_obj:
        run_obj.log_parameters({"a": "b", "c": "d", "e": 5})
        assert run_obj._trial_component.parameters == {"a": "b", "c": "d", "e": 5}


def test_log_parameters_skip_invalid_values(run_obj):
    with run_obj:
        run_obj.log_parameters({"a": "b", "c": "d", "e": 5, "f": nan})
        assert run_obj._trial_component.parameters == {"a": "b", "c": "d", "e": 5}


def test_log_input_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_artifact("foo", "baz", "text/text", False)
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_input(run_obj):
    with run_obj:
        run_obj.log_artifact("foo", "baz", "text/text", False)
        assert run_obj._trial_component.input_artifacts == {
            "foo": TrialComponentArtifact(value="baz", media_type="text/text")
        }


def test_log_output_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_artifact("foo", "baz", "text/text")
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_output(run_obj):
    with run_obj:
        run_obj.log_artifact("foo", "baz", "text/text")
        assert run_obj._trial_component.output_artifacts == {
            "foo": TrialComponentArtifact(value="baz", media_type="text/text")
        }


def test_log_metric_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_metric(name="foo", value=1.0, step=1)
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_metric(run_obj):
    now = datetime.datetime.now()
    with run_obj:
        run_obj.log_metric(name="foo", value=1.0, step=1, timestamp=now)
        run_obj._metrics_manager.log_metric.assert_called_with(
            metric_name="foo", value=1.0, step=1, timestamp=now
        )


def test_log_metric_skip_invalid_value(run_obj):
    with run_obj:
        run_obj.log_metric(None, nan, None, None)
        assert not run_obj._metrics_manager.log_metric.called


def test_log_metric_attribute_error(run_obj):
    now = datetime.datetime.now()
    with run_obj:
        run_obj._metrics_manager.log_metric.side_effect = AttributeError

        with pytest.raises(AttributeError):
            run_obj.log_metric("foo", 1.0, 1, now)


def test_log_output_artifact_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_file("foo.txt", "name", "whizz/bang")
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_output_artifact(run_obj):
    run_obj._artifact_uploader.upload_artifact.return_value = ("s3uri_value", "etag_value")
    with run_obj:
        run_obj.log_file("foo.txt", "name", "whizz/bang")
        run_obj._artifact_uploader.upload_artifact.assert_called_with("foo.txt")
        assert "whizz/bang" == run_obj._trial_component.output_artifacts["name"].media_type

        run_obj.log_file("foo.txt")
        run_obj._artifact_uploader.upload_artifact.assert_called_with("foo.txt")
        assert "foo.txt" in run_obj._trial_component.output_artifacts
        assert "text/plain" == run_obj._trial_component.output_artifacts["foo.txt"].media_type


def test_log_input_artifact_outside_run_context(run_obj):
    with pytest.raises(RuntimeError) as err:
        run_obj.log_file("foo.txt", "name", "whizz/bang", is_output=False)
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_input_artifact(run_obj):
    run_obj._artifact_uploader.upload_artifact.return_value = ("s3uri_value", "etag_value")
    with run_obj:
        run_obj.log_file("foo.txt", "name", "whizz/bang", is_output=False)
        run_obj._artifact_uploader.upload_artifact.assert_called_with("foo.txt")
        assert "whizz/bang" == run_obj._trial_component.input_artifacts["name"].media_type

        run_obj.log_file("foo.txt", is_output=False)
        run_obj._artifact_uploader.upload_artifact.assert_called_with("foo.txt")
        assert "foo.txt" in run_obj._trial_component.input_artifacts
        assert "text/plain" == run_obj._trial_component.input_artifacts["foo.txt"].media_type


def test_log_multiple_inputs(run_obj):
    with run_obj:
        for index in range(0, MAX_RUN_TC_ARTIFACTS_LEN):
            file_path = "foo" + str(index) + ".txt"
            run_obj._trial_component.input_artifacts[file_path] = {
                "foo": TrialComponentArtifact(value="baz" + str(index), media_type="text/text")
            }
        with pytest.raises(ValueError) as error:
            run_obj.log_artifact("foo.txt", "name", "whizz/bang", False)
        assert f"Cannot add more than {MAX_RUN_TC_ARTIFACTS_LEN} input_artifacts" in str(error)


def test_log_multiple_outputs(run_obj):
    with run_obj:
        for index in range(0, MAX_RUN_TC_ARTIFACTS_LEN):
            file_path = "foo" + str(index) + ".txt"
            run_obj._trial_component.output_artifacts[file_path] = {
                "foo": TrialComponentArtifact(value="baz" + str(index), media_type="text/text")
            }
        with pytest.raises(ValueError) as error:
            run_obj.log_artifact("foo.txt", "name", "whizz/bang")
        assert f"Cannot add more than {MAX_RUN_TC_ARTIFACTS_LEN} output_artifacts" in str(error)


def test_log_multiple_input_artifacts(run_obj):
    with run_obj:
        for index in range(0, MAX_RUN_TC_ARTIFACTS_LEN):
            file_path = "foo" + str(index) + ".txt"
            run_obj._artifact_uploader.upload_artifact.return_value = (
                "s3uri_value" + str(index),
                "etag_value" + str(index),
            )
            run_obj.log_file(
                file_path, "name" + str(index), "whizz/bang" + str(index), is_output=False
            )
            run_obj._artifact_uploader.upload_artifact.assert_called_with(file_path)

        run_obj._artifact_uploader.upload_artifact.return_value = (
            "s3uri_value",
            "etag_value",
        )

        # log an output artifact, should be fine
        run_obj.log_file("foo.txt", "name", "whizz/bang", is_output=True)

        # log an extra input artifact, should raise exception
        with pytest.raises(ValueError) as error:
            run_obj.log_file("foo.txt", "name", "whizz/bang", is_output=False)
        assert f"Cannot add more than {MAX_RUN_TC_ARTIFACTS_LEN} input_artifacts" in str(error)


def test_log_multiple_output_artifacts(run_obj):
    with run_obj:
        for index in range(0, MAX_RUN_TC_ARTIFACTS_LEN):
            file_path = "foo" + str(index) + ".txt"
            run_obj._artifact_uploader.upload_artifact.return_value = (
                "s3uri_value" + str(index),
                "etag_value" + str(index),
            )
            run_obj.log_file(file_path, "name" + str(index), "whizz/bang" + str(index))
            run_obj._artifact_uploader.upload_artifact.assert_called_with(file_path)

        run_obj._artifact_uploader.upload_artifact.return_value = (
            "s3uri_value",
            "etag_value",
        )

        # log an input artifact, should be fine
        run_obj.log_file("foo.txt", "name", "whizz/bang", is_output=False)

        # log an extra output artifact, should raise exception
        with pytest.raises(ValueError) as error:
            run_obj.log_file("foo.txt", "name", "whizz/bang")
        assert f"Cannot add more than {MAX_RUN_TC_ARTIFACTS_LEN} output_artifacts" in str(error)


def test_log_precision_recall_outside_run_context(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35, 0.8]
    no_skill = 0.1
    title = "TestPrecisionRecall"

    with pytest.raises(RuntimeError) as err:
        run_obj.log_precision_recall(
            y_true, y_scores, 0, title=title, no_skill=no_skill, is_output=False
        )
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_precision_recall(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35, 0.8]
    no_skill = 0.1
    title = "TestPrecisionRecall"

    run_obj._artifact_uploader.upload_object_artifact.return_value = (
        "s3uri_value",
        "etag_value",
    )
    with run_obj:
        run_obj.log_precision_recall(
            y_true, y_scores, 0, title=title, no_skill=no_skill, is_output=False
        )

        expected_data = {
            "type": "PrecisionRecallCurve",
            "version": 0,
            "title": title,
            "precision": [0.5, 0.3333333333333333, 0.5, 0.0, 1.0],
            "recall": [1.0, 0.5, 0.5, 0.0, 0.0],
            "averagePrecisionScore": 0.5,
            "noSkill": 0.1,
        }
        run_obj._artifact_uploader.upload_object_artifact.assert_called_with(
            title, expected_data, file_extension="json"
        )

        run_obj._lineage_artifact_tracker.add_input_artifact.assert_called_with(
            name=title,
            source_uri="s3uri_value",
            etag="etag_value",
            artifact_type="PrecisionRecallCurve",
        )


def test_log_precision_recall_invalid_input(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35]
    no_skill = 0.1

    with run_obj:
        with pytest.raises(ValueError) as error:
            run_obj.log_precision_recall(
                y_true, y_scores, 0, title="TestPrecisionRecall", no_skill=no_skill, is_output=False
            )
        assert "Lengths mismatch between true labels and predicted probabilities" in str(error)


def test_log_confusion_matrix_outside_run_context(run_obj):
    y_true = [2, 0, 2, 2, 0, 1]
    y_pred = [0, 0, 2, 2, 0, 2]

    with pytest.raises(RuntimeError) as err:
        run_obj.log_confusion_matrix(y_true, y_pred, title="TestConfusionMatrix")
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_confusion_matrix(run_obj):
    y_true = [2, 0, 2, 2, 0, 1]
    y_pred = [0, 0, 2, 2, 0, 2]

    run_obj._artifact_uploader.upload_object_artifact.return_value = (
        "s3uri_value",
        "etag_value",
    )
    with run_obj:
        run_obj.log_confusion_matrix(y_true, y_pred, title="TestConfusionMatrix")

        expected_data = {
            "type": "ConfusionMatrix",
            "version": 0,
            "title": "TestConfusionMatrix",
            "confusionMatrix": [[2, 0, 0], [0, 0, 1], [1, 0, 2]],
        }

        run_obj._artifact_uploader.upload_object_artifact.assert_called_with(
            "TestConfusionMatrix", expected_data, file_extension="json"
        )

        run_obj._lineage_artifact_tracker.add_output_artifact.assert_called_with(
            name="TestConfusionMatrix",
            source_uri="s3uri_value",
            etag="etag_value",
            artifact_type="ConfusionMatrix",
        )


def test_log_confusion_matrix_invalid_input(run_obj):
    y_true = [2, 0, 2, 2, 0, 1]
    y_pred = [0, 0, 2, 2, 0]

    with run_obj:
        with pytest.raises(ValueError) as error:
            run_obj.log_confusion_matrix(y_true, y_pred, title="TestConfusionMatrix")
        assert "Lengths mismatch between true labels and predicted labels" in str(error)


def test_log_roc_curve_outside_run_context(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35, 0.8]

    with pytest.raises(RuntimeError) as err:
        run_obj.log_roc_curve(y_true, y_scores, title="TestROCCurve", is_output=False)
    assert "This method should be called inside context of 'with' statement" in str(err)


def test_log_roc_curve(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35, 0.8]
    with run_obj:
        run_obj._artifact_uploader.upload_object_artifact.return_value = (
            "s3uri_value",
            "etag_value",
        )

        run_obj.log_roc_curve(y_true, y_scores, title="TestROCCurve", is_output=False)

        expected_data = {
            "type": "ROCCurve",
            "version": 0,
            "title": "TestROCCurve",
            "falsePositiveRate": [0.0, 0.0, 0.5, 0.5, 1.0],
            "truePositiveRate": [0.0, 0.5, 0.5, 1.0, 1.0],
            "areaUnderCurve": 0.75,
        }
        run_obj._artifact_uploader.upload_object_artifact.assert_called_with(
            "TestROCCurve", expected_data, file_extension="json"
        )

        run_obj._lineage_artifact_tracker.add_input_artifact.assert_called_with(
            name="TestROCCurve",
            source_uri="s3uri_value",
            etag="etag_value",
            artifact_type="ROCCurve",
        )


def test_log_roc_curve_invalid_input(run_obj):
    y_true = [0, 0, 1, 1]
    y_scores = [0.1, 0.4, 0.35]

    with run_obj:
        with pytest.raises(ValueError) as error:
            run_obj.log_roc_curve(y_true, y_scores, title="TestROCCurve", is_output=False)
        assert "Lengths mismatch between true labels and predicted scores" in str(error)


@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch("sagemaker.experiments.run._TrialComponent._load_or_create")
@patch("sagemaker.experiments.run._TrialComponent.list")
@patch("sagemaker.experiments.run._TrialComponent.search")
def test_list(mock_tc_search, mock_tc_list, mock_tc_load, run_obj, sagemaker_session):
    start_time = datetime.datetime.now(datetime.timezone.utc) + datetime.timedelta(hours=1)
    end_time = datetime.datetime.now(datetime.timezone.utc) + datetime.timedelta(hours=2)
    creation_time = datetime.datetime.now(datetime.timezone.utc) + datetime.timedelta(hours=3)
    last_modified_time = datetime.datetime.now(datetime.timezone.utc) + datetime.timedelta(hours=4)
    tc_list_len = 20
    tc_list_len_half = int(tc_list_len / 2)
    mock_tc_search.side_effect = [
        [
            TrialComponentSearchResult(
                trial_component_name=Run._generate_trial_component_name(
                    "a" + str(i), TEST_EXP_NAME
                ),
                trial_component_arn="b" + str(i),
                display_name="C" + str(i),
                creation_time=creation_time + datetime.timedelta(hours=i),
                last_modified_time=last_modified_time + datetime.timedelta(hours=i),
                last_modified_by={},
                tags=[RUN_TC_TAG] if i < tc_list_len_half else None,
            )
        ]
        for i in range(tc_list_len)
    ]
    mock_tc_list.return_value = [
        TrialComponentSummary(
            trial_component_name=Run._generate_trial_component_name(
                "A" + str(i), TEST_EXP_NAME_MIXED_CASE
            ),
            trial_component_arn="b" + str(i),
            display_name="C" + str(i),
            source_arn="D" + str(i),
            status=TrialComponentStatus(
                primary_status=_TrialComponentStatusType.InProgress.value, message="E" + str(i)
            ),
            start_time=start_time + datetime.timedelta(hours=i),
            end_time=end_time + datetime.timedelta(hours=i),
            creation_time=creation_time + datetime.timedelta(hours=i),
            last_modified_time=last_modified_time + datetime.timedelta(hours=i),
            last_modified_by={},
        )
        for i in range(tc_list_len)
    ]
    mock_tc_load.side_effect = [
        (
            _TrialComponent(
                trial_component_name=Run._generate_trial_component_name(
                    "a" + str(i), TEST_EXP_NAME_MIXED_CASE
                ),
                trial_component_arn="b" + str(i),
                display_name="C" + str(i),
                source_arn="D" + str(i),
                status=TrialComponentStatus(
                    primary_status=_TrialComponentStatusType.InProgress.value, message="E" + str(i)
                ),
                start_time=start_time + datetime.timedelta(hours=i),
                end_time=end_time + datetime.timedelta(hours=i),
                creation_time=creation_time + datetime.timedelta(hours=i),
                last_modified_time=last_modified_time + datetime.timedelta(hours=i),
                last_modified_by={},
            ),
            True,
        )
        for i in range(tc_list_len_half)
    ]

    run_list = list_runs(
        experiment_name=TEST_EXP_NAME_MIXED_CASE,
        sort_by=SortByType.CREATION_TIME,
        sort_order=SortOrderType.ASCENDING,
        sagemaker_session=sagemaker_session,
    )

    mock_tc_list.assert_called_once_with(
        experiment_name=TEST_EXP_NAME_MIXED_CASE,
        created_before=None,
        created_after=None,
        sort_by="CreationTime",
        sort_order="Ascending",
        sagemaker_session=sagemaker_session,
        max_results=None,
        next_token=None,
    )
    assert len(run_list) == tc_list_len_half
    for i in range(tc_list_len_half):
        run = run_list[i]
        assert run.experiment_name == TEST_EXP_NAME
        assert run.run_name == "a" + str(i)
        assert run._experiment
        assert run._trial
        assert isinstance(run._trial_component, _TrialComponent)
        assert run._trial_component.trial_component_name == Run._generate_trial_component_name(
            "a" + str(i), TEST_EXP_NAME
        )
        assert run._in_load is False
        assert run._inside_load_context is False
        assert run._inside_init_context is False
        assert run._artifact_uploader
        assert run._lineage_artifact_tracker
        assert run._metrics_manager


@patch("sagemaker.experiments.run._TrialComponent.list")
def test_list_empty(mock_tc_list, sagemaker_session):
    mock_tc_list.return_value = []
    assert [] == list_runs(experiment_name=TEST_EXP_NAME, sagemaker_session=sagemaker_session)


@patch(
    "sagemaker.experiments.run.Experiment._load_or_create",
    MagicMock(return_value=Experiment(experiment_name=TEST_EXP_NAME)),
)
@patch(
    "sagemaker.experiments.run._Trial._load_or_create",
    MagicMock(side_effect=mock_trial_load_or_create_func),
)
@patch.object(_Trial, "add_trial_component", MagicMock(return_value=None))
@patch("sagemaker.experiments.run._TrialComponent._load_or_create")
def test_enter_exit_locally(mock_load_tc, sagemaker_session, run_obj):
    mock_load_tc.return_value = run_obj._trial_component, False
    sagemaker_session.sagemaker_client.update_trial_component.return_value = {}
    _verify_tc_status_before_enter_init(run_obj._trial_component)

    with run_obj:
        _verify_tc_status_when_entering(run_obj._trial_component)
        init_start_time = run_obj._trial_component.start_time

        with load_run(sagemaker_session=sagemaker_session):
            _verify_tc_status_when_entering(
                trial_component=run_obj._trial_component,
                init_start_time=init_start_time,
            )

        old_end_time = _verify_tc_status_when_successfully_exit(
            trial_component=run_obj._trial_component,
        )

    old_end_time = _verify_tc_status_when_successfully_exit(
        trial_component=run_obj._trial_component,
        old_end_time=old_end_time,
    )

    # Re-load to verify:
    # 1. if it works when load_run and with are not in one line
    # 2. if re-entering the load will change the "Completed" TC status
    # to "InProgress"
    # 3. when exiting the load, the end_time and status will be overridden again
    run_load = load_run(
        experiment_name=run_obj.experiment_name,
        run_name=run_obj.run_name,
        sagemaker_session=sagemaker_session,
    )
    with run_load:
        _verify_tc_status_when_entering(
            trial_component=run_obj._trial_component,
            init_start_time=init_start_time,
            has_completed=True,
        )
    _verify_tc_status_when_successfully_exit(
        trial_component=run_obj._trial_component, old_end_time=old_end_time
    )


def test_exit_fail(sagemaker_session, run_obj):
    sagemaker_session.sagemaker_client.update_trial_component.return_value = {}
    try:
        with run_obj:
            raise ValueError("Foo")
    except ValueError:
        pass

    assert run_obj._trial_component.status.primary_status == _TrialComponentStatusType.Failed.value
    assert run_obj._trial_component.status.message
    assert isinstance(run_obj._trial_component.end_time, datetime.datetime)


@pytest.mark.parametrize(
    "metric_value",
    [1.3, "nan", "inf", "-inf", None],
)
def test_is_input_valid(run_obj, metric_value):
    assert run_obj._is_input_valid("metric", "Name", metric_value)


@pytest.mark.parametrize(
    "metric_value",
    [nan, inf, -inf],
)
def test_is_input_valid_false(run_obj, metric_value):
    assert not run_obj._is_input_valid("parameter", "Name", metric_value)


def test_generate_trial_name():
    base_name = "x" * MAX_NAME_LEN_IN_BACKEND
    trial_name = Run._generate_trial_name(base_name=base_name)
    assert len(trial_name) <= MAX_NAME_LEN_IN_BACKEND


def test_append_run_tc_label_to_tags():
    expected_tc_tag = RUN_TC_TAG

    tags = None
    ret = Run._append_run_tc_label_to_tags(tags)
    assert len(ret) == 1
    assert expected_tc_tag in ret

    tags = []
    ret = Run._append_run_tc_label_to_tags(tags)
    assert len(ret) == 1
    assert expected_tc_tag in ret

    tags = [{"Key": "foo", "Value": "bar"}]
    ret = Run._append_run_tc_label_to_tags(tags)
    assert len(ret) == 2
    assert expected_tc_tag in ret

    tags = [expected_tc_tag]
    ret = Run._append_run_tc_label_to_tags(tags)
    assert len(ret) == 1
    assert expected_tc_tag in ret


def _verify_tc_status_before_enter_init(trial_component):
    assert not trial_component.start_time
    assert not trial_component.end_time
    assert not trial_component.status


def _verify_tc_status_when_entering(trial_component, init_start_time=None, has_completed=False):
    if not init_start_time:
        assert isinstance(trial_component.start_time, datetime.datetime)
        now = datetime.datetime.now(dateutil.tz.tzlocal())
        assert (now.timestamp() - trial_component.start_time.timestamp()) < 1
    else:
        assert trial_component.start_time == init_start_time

    if not has_completed:
        assert not trial_component.end_time
    assert trial_component.status.primary_status == _TrialComponentStatusType.InProgress.value


def _verify_tc_status_when_successfully_exit(trial_component, old_end_time=None):
    assert trial_component.status.primary_status == _TrialComponentStatusType.Completed.value
    assert isinstance(trial_component.start_time, datetime.datetime)
    assert isinstance(trial_component.end_time, datetime.datetime)
    if old_end_time:
        assert trial_component.end_time > old_end_time
    return trial_component.end_time