# SPDX-License-Identifier: Apache-2.0
# The OpenSearch Contributors require contributions made to
# this file be licensed under the Apache-2.0 license or a
# compatible open source license.
# Any modifications Copyright OpenSearch Contributors. See
# GitHub history for details.

#  Licensed to Elasticsearch B.V. under one or more contributor
#  license agreements. See the NOTICE file distributed with
#  this work for additional information regarding copyright
#  ownership. Elasticsearch B.V. licenses this file to you under
#  the Apache License, Version 2.0 (the "License"); you may
#  not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
# 	http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing,
#  software distributed under the License is distributed on an
#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
#  KIND, either express or implied.  See the License for the
#  specific language governing permissions and limitations
#  under the License.

# File called _pytest for PyCharm compatibility

import pytest

from tests.common import TestData


class TestDataFrameFilter(TestData):
    """Exercise ``filter`` on data frames along both the column and index axes.

    Tests taking ``df`` rely on a fixture defined outside this file; from its
    usage here it exposes ``.oml`` and ``.pd`` frames plus ``filter`` and
    ``check_values`` helpers.
    """

    def test_filter_arguments_mutually_exclusive(self, df):
        """Any combination other than exactly one selector raises TypeError."""
        invalid_argument_sets = (
            {"items": [], "like": "!", "regex": "!"},
            {"items": [], "regex": "!"},
            {"items": [], "like": "!"},
            {"like": "!", "regex": "!"},
            {},  # no selector at all
        )
        for kwargs in invalid_argument_sets:
            with pytest.raises(TypeError):
                df.filter(**kwargs)

    @pytest.mark.parametrize(
        "items",
        [
            ["DestCountry", "Cancelled", "AvgTicketPrice"],
            [],
            ["notfound", "AvgTicketPrice"],
        ],
    )
    def test_filter_columns_items(self, df, items):
        """Filter by explicit names, including an empty and a partly unknown list."""
        df.filter(items=items)

    @pytest.mark.parametrize("like", ["Flight", "Nope"])
    def test_filter_columns_like(self, df, like):
        """Filter by substring."""
        df.filter(like=like)

    @pytest.mark.parametrize("regex", ["^Flig", "^Flight.*r$", ".*", "^[^C]"])
    def test_filter_columns_regex(self, df, regex):
        """Filter by regular expression."""
        df.filter(regex=regex)

    def test_filter_index_items(self, df):
        """Filter rows by index label and compare the oml and pandas results."""
        # The two frames may label their rows differently, so each side is
        # filtered with its own labels: fixed string labels for pandas and
        # labels read from the materialised index for oml.
        single_pd_label = ["20"]
        many_pd_labels = [str(n) for n in range(30)]

        materialised_index = df.oml.to_pandas().index
        single_oml_label = [materialised_index[20]]
        many_oml_labels = list(materialised_index[:30])

        df.filter(items=[], axis=0)

        label_pairs = (
            (single_oml_label, single_pd_label),
            (many_oml_labels, many_pd_labels),
        )
        for oml_labels, pd_labels in label_pairs:
            df.check_values(
                df.oml.filter(items=oml_labels, axis=0),
                df.pd.filter(items=pd_labels, axis=0),
            )

    def test_filter_index_like_and_regex(self):
        """``like`` and ``regex`` on the index axis raise NotImplementedError."""
        small_frame = self.oml_flights_small()

        for selector in ({"like": "2"}, {"regex": "^2"}):
            with pytest.raises(NotImplementedError):
                small_frame.filter(**selector, axis=0)

    def test_filter_index_order(self):
        """Rows come back in the order the requested labels were given."""
        frame = self.oml_flights()

        # Take the first five labels and ask for them back-to-front.
        items = list(frame.to_pandas().index[:5])[::-1]

        filtered_index = frame.filter(axis="index", items=items).to_pandas().index
        assert list(filtered_index) == items