from __future__ import annotations

from collections.abc import Callable
from collections.abc import Sequence
from typing import Any
import warnings

from _pytest.mark.structures import MarkDecorator
import numpy as np
import pytest

import optuna
from optuna.distributions import BaseDistribution
from optuna.distributions import CategoricalChoiceType
from optuna.distributions import CategoricalDistribution
from optuna.distributions import FloatDistribution
from optuna.distributions import IntDistribution
from optuna.samplers import BaseSampler
from optuna.study import Study
from optuna.trial import FrozenTrial
from optuna.trial import Trial
from optuna.trial import TrialState


def parametrize_suggest_method(name: str) -> MarkDecorator:
    """Build a ``parametrize`` mark covering several ways to suggest ``name``.

    The decorated test receives an argument called ``suggest_method_<name>``.
    Each parameter value is a callable that takes a trial and suggests the
    parameter ``name`` from one kind of distribution: float, int, categorical,
    stepped float, log-scaled float, or log-scaled int.

    Args:
        name: Name of the parameter to suggest; also used as the suffix of the
            parametrized argument name.

    Returns:
        The mark produced by ``pytest.mark.parametrize``.
    """
    argname = f"suggest_method_{name}"
    # Lambdas are kept on purpose (and in this order) so that the generated
    # test IDs stay the same.
    suggest_callables = [
        lambda trial: trial.suggest_float(name, 0, 10),
        lambda trial: trial.suggest_int(name, 0, 10),
        lambda trial: trial.suggest_categorical(name, [0, 1, 2]),
        lambda trial: trial.suggest_float(name, 0, 10, step=0.5),
        lambda trial: trial.suggest_float(name, 1e-7, 10, log=True),
        lambda trial: trial.suggest_int(name, 1, 10, log=True),
    ]
    return pytest.mark.parametrize(argname, suggest_callables)


def _create_new_trial(study: Study) -> FrozenTrial:
    """Register a new trial in the study's storage and return what the storage holds for it.

    Args:
        study: Study whose ``_storage`` and ``_study_id`` are used.

    Returns:
        The result of ``get_trial`` for the newly created trial ID.
    """
    storage = study._storage
    new_trial_id = storage.create_new_trial(study._study_id)
    return storage.get_trial(new_trial_id)


class FixedSampler(BaseSampler):
    """Sampler that returns values supplied at construction time.

    The relative search space, the relative parameters and the value returned
    for independently sampled parameters are all stored as given and handed
    back unchanged.
    """

    def __init__(
        self,
        relative_search_space: dict[str, BaseDistribution],
        relative_params: dict[str, Any],
        unknown_param_value: Any,
    ) -> None:
        """Store the values that the sampling methods will return.

        Args:
            relative_search_space: Returned by ``infer_relative_search_space``.
            relative_params: Returned by ``sample_relative``.
            unknown_param_value: Returned by ``sample_independent``.
        """
        self.relative_search_space = relative_search_space
        self.relative_params = relative_params
        self.unknown_param_value = unknown_param_value

    def infer_relative_search_space(
        self,
        study: Study,
        trial: FrozenTrial,
    ) -> dict[str, BaseDistribution]:
        """Return the stored relative search space; the arguments are ignored."""
        return self.relative_search_space

    def sample_relative(
        self,
        study: Study,
        trial: FrozenTrial,
        search_space: dict[str, BaseDistribution],
    ) -> dict[str, Any]:
        """Return the stored relative parameters; the arguments are ignored."""
        return self.relative_params

    def sample_independent(
        self,
        study: Study,
        trial: FrozenTrial,
        param_name: str,
        param_distribution: BaseDistribution,
    ) -> Any:
        """Return the stored ``unknown_param_value``; the arguments are ignored."""
        return self.unknown_param_value


class _BaseSamplerTestCase:
    """Base class for the sampler test cases in this module.

    Subclasses are expected to override the ``sampler`` fixture so that it
    provides a zero-argument callable returning the sampler under test.
    """

    @pytest.fixture
    def sampler(self) -> Callable[[], BaseSampler]:
        """Placeholder fixture; must be overridden.

        Raises:
            NotImplementedError: Always, with a message that names the fixture
                that has to be overridden.
        """
        raise NotImplementedError(
            "Override the `sampler` fixture to return a zero-argument callable "
            "that creates the sampler under test."
        )


class BasicSamplerTestCase(_BaseSamplerTestCase):
    """Checks of ``sample_independent`` and of short single-objective optimization runs.

    Every test receives the ``sampler`` fixture, a zero-argument callable that
    creates the sampler under test.
    """

    @pytest.mark.parametrize(
        "distribution",
        [
            FloatDistribution(-1.0, 1.0),
            FloatDistribution(0.0, 1.0),
            FloatDistribution(-1.0, 0.0),
            FloatDistribution(1e-7, 1.0, log=True),
            FloatDistribution(-10, 10, step=0.1),
            FloatDistribution(-10.2, 10.2, step=0.1),
        ],
    )
    def test_float(
        self,
        sampler: Callable[[], BaseSampler],
        distribution: FloatDistribution,
    ) -> None:
        """Independently sampled floats stay in range, are not NumPy scalars, and follow ``step``."""
        study = optuna.study.create_study(sampler=sampler())
        points = np.array(
            [
                study.sampler.sample_independent(
                    study, _create_new_trial(study), "x", distribution
                )
                for _ in range(100)
            ]
        )
        assert np.all(points >= distribution.low)
        assert np.all(points <= distribution.high)
        assert not isinstance(
            study.sampler.sample_independent(study, _create_new_trial(study), "x", distribution),
            np.floating,
        )

        if distribution.step is not None:
            # Check all points are multiples of distribution.step.
            points -= distribution.low
            points /= distribution.step
            round_points = np.round(points)
            np.testing.assert_almost_equal(round_points, points)

    @pytest.mark.parametrize(
        "distribution",
        [
            IntDistribution(-10, 10),
            IntDistribution(0, 10),
            IntDistribution(-10, 0),
            IntDistribution(-10, 10, step=2),
            IntDistribution(0, 10, step=2),
            IntDistribution(-10, 0, step=2),
            IntDistribution(1, 100, log=True),
        ],
    )
    def test_int(self, sampler: Callable[[], BaseSampler], distribution: IntDistribution) -> None:
        """Independently sampled ints stay in range, follow ``step``, and are not NumPy scalars."""
        study = optuna.study.create_study(sampler=sampler())
        points = np.array(
            [
                study.sampler.sample_independent(
                    study, _create_new_trial(study), "x", distribution
                )
                for _ in range(100)
            ]
        )
        assert np.all(points >= distribution.low)
        assert np.all(points <= distribution.high)
        # Mirror the step check of ``test_float``: every sample must lie on the grid
        # ``low + k * step``.
        assert np.all((points - distribution.low) % distribution.step == 0)
        assert not isinstance(
            study.sampler.sample_independent(study, _create_new_trial(study), "x", distribution),
            np.integer,
        )

    @pytest.mark.parametrize("choices", [(1, 2, 3), ("a", "b", "c"), (1, "a")])
    def test_categorical(
        self, sampler: Callable[[], BaseSampler], choices: Sequence[CategoricalChoiceType]
    ) -> None:
        """Independently sampled categorical values map to valid indices of ``choices``."""
        distribution = CategoricalDistribution(choices)

        study = optuna.study.create_study(sampler=sampler())

        def sample() -> float:
            trial = _create_new_trial(study)
            param_value = study.sampler.sample_independent(study, trial, "x", distribution)
            return float(distribution.to_internal_repr(param_value))

        points = np.asarray([sample() for _ in range(100)])

        # 'x' value is corresponding to an index of distribution.choices.
        assert np.all(points >= 0)
        assert np.all(points <= len(distribution.choices) - 1)
        round_points = np.round(points)
        np.testing.assert_almost_equal(round_points, points)

    def test_conditional_sample_independent(self, sampler: Callable[[], BaseSampler]) -> None:
        """Sample a parameter whose name depends on a previously sampled category."""
        # This test case reproduces the error reported in #2734.
        # See https://github.com/optuna/optuna/pull/2734#issuecomment-857649769.

        study = optuna.study.create_study(sampler=sampler())
        categorical_distribution = CategoricalDistribution(choices=["x", "y"])
        dependent_distribution = CategoricalDistribution(choices=["a", "b"])

        study.add_trial(
            optuna.create_trial(
                params={"category": "x", "x": "a"},
                distributions={"category": categorical_distribution, "x": dependent_distribution},
                value=0.1,
            )
        )

        study.add_trial(
            optuna.create_trial(
                params={"category": "y", "y": "b"},
                distributions={"category": categorical_distribution, "y": dependent_distribution},
                value=0.1,
            )
        )

        _trial = _create_new_trial(study)
        category = study.sampler.sample_independent(
            study, _trial, "category", categorical_distribution
        )
        assert category in ["x", "y"]
        value = study.sampler.sample_independent(study, _trial, category, dependent_distribution)
        assert value in ["a", "b"]

    def test_nan_objective_value(self, sampler: Callable[[], BaseSampler]) -> None:
        """A NaN objective value must not change ``study.best_value``."""
        study = optuna.create_study(sampler=sampler())

        def objective(trial: Trial, base_value: float) -> float:
            return trial.suggest_float("x", 0.1, 0.2) + base_value

        # Non NaN objective values.
        for i in range(10, 1, -1):
            # Bind the loop variable as a default so the lambda does not rely on
            # late binding of ``i``.
            study.optimize(
                lambda t, base_value=i: objective(t, base_value), n_trials=1, catch=()
            )
        assert int(study.best_value) == 2

        # NaN objective values.
        study.optimize(lambda t: objective(t, float("nan")), n_trials=1, catch=())
        assert int(study.best_value) == 2

        # Non NaN objective value.
        study.optimize(lambda t: objective(t, 1), n_trials=1, catch=())
        assert int(study.best_value) == 1

    def test_partial_fixed_sampling(self, sampler: Callable[[], BaseSampler]) -> None:
        """Wrapping the sampler in ``PartialFixedSampler`` fixes the requested parameter."""
        study = optuna.create_study(sampler=sampler())

        def objective(trial: Trial) -> float:
            x = trial.suggest_float("x", -1, 1)
            y = trial.suggest_int("y", -1, 1)
            z = trial.suggest_float("z", -1, 1)
            return x + y + z

        # First trial.
        study.optimize(objective, n_trials=1)

        # Second trial. Here, the parameter ``y`` is fixed as 0.
        fixed_params = {"y": 0}
        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            study.sampler = optuna.samplers.PartialFixedSampler(fixed_params, study.sampler)
        study.optimize(objective, n_trials=1)
        trial_params = study.trials[-1].params
        assert trial_params["y"] == fixed_params["y"]

    def test_sample_single_distribution(self, sampler: Callable[[], BaseSampler]) -> None:
        """Distributions that contain a single value always yield that value."""
        relative_search_space = {
            "a": CategoricalDistribution([1]),
            "b": IntDistribution(low=1, high=1),
            "c": IntDistribution(low=1, high=1, log=True),
            "d": FloatDistribution(low=1.0, high=1.0),
            "e": FloatDistribution(low=1.0, high=1.0, log=True),
            "f": FloatDistribution(low=1.0, high=1.0, step=1.0),
        }

        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            sampler_ = sampler()
        study = optuna.study.create_study(sampler=sampler_)

        # We need to test the construction of the model, so we should set `n_trials >= 2`.
        for _ in range(2):
            trial = study.ask(fixed_distributions=relative_search_space)
            study.tell(trial, 1.0)
            for param_name in relative_search_space:
                assert trial.params[param_name] == 1

    @parametrize_suggest_method("x")
    def test_single_parameter_objective(
        self, sampler: Callable[[], BaseSampler], suggest_method_x: Callable[[Trial], float]
    ) -> None:
        """Ten trials of a one-parameter objective all complete."""

        def objective(trial: Trial) -> float:
            return suggest_method_x(trial)

        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            sampler_ = sampler()

        study = optuna.study.create_study(sampler=sampler_)
        study.optimize(objective, n_trials=10)

        assert len(study.trials) == 10
        assert all(t.state == TrialState.COMPLETE for t in study.trials)

    def test_conditional_parameter_objective(self, sampler: Callable[[], BaseSampler]) -> None:
        """Ten trials of an objective with a conditional parameter all complete."""

        def objective(trial: Trial) -> float:
            x = trial.suggest_categorical("x", [True, False])
            if x:
                return trial.suggest_float("y", 0, 1)
            return trial.suggest_float("z", 0, 1)

        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            sampler_ = sampler()

        study = optuna.study.create_study(sampler=sampler_)
        study.optimize(objective, n_trials=10)

        assert len(study.trials) == 10
        assert all(t.state == TrialState.COMPLETE for t in study.trials)

    @parametrize_suggest_method("x")
    @parametrize_suggest_method("y")
    def test_combination_of_different_distributions_objective(
        self,
        sampler: Callable[[], BaseSampler],
        suggest_method_x: Callable[[Trial], float],
        suggest_method_y: Callable[[Trial], float],
    ) -> None:
        """Three trials complete for every pairing of suggest methods for ``x`` and ``y``."""

        def objective(trial: Trial) -> float:
            return suggest_method_x(trial) + suggest_method_y(trial)

        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            sampler_ = sampler()

        study = optuna.study.create_study(sampler=sampler_)
        study.optimize(objective, n_trials=3)

        assert len(study.trials) == 3
        assert all(t.state == TrialState.COMPLETE for t in study.trials)

    @pytest.mark.parametrize(
        "second_low,second_high",
        [
            (0, 5),  # Narrow range.
            (0, 20),  # Expand range.
            (20, 30),  # Set non-overlapping range.
        ],
    )
    def test_dynamic_range_objective(
        self, sampler: Callable[[], BaseSampler], second_low: int, second_high: int
    ) -> None:
        """All trials complete when the parameter range changes between two ``optimize`` calls."""

        def objective(trial: Trial, low: int, high: int) -> float:
            v = trial.suggest_float("x", low, high)
            v += trial.suggest_int("y", low, high)
            return v

        with warnings.catch_warnings():
            warnings.simplefilter("ignore", optuna.exceptions.ExperimentalWarning)
            sampler_ = sampler()

        study = optuna.study.create_study(sampler=sampler_)
        study.optimize(lambda t: objective(t, 0, 10), n_trials=10)
        study.optimize(lambda t: objective(t, second_low, second_high), n_trials=10)

        assert len(study.trials) == 20
        assert all(t.state == TrialState.COMPLETE for t in study.trials)


class RelativeSamplerTestCase(_BaseSamplerTestCase):
    """Checks of ``sample_relative`` over numerical, categorical and mixed search spaces.

    Every test receives the ``sampler`` fixture, a zero-argument callable that
    creates the sampler under test.
    """

    @pytest.mark.parametrize(
        "x_distribution",
        [
            FloatDistribution(-1.0, 1.0),
            FloatDistribution(1e-7, 1.0, log=True),
            FloatDistribution(-10, 10, step=0.5),
            IntDistribution(3, 10),
            IntDistribution(1, 100, log=True),
            IntDistribution(3, 9, step=2),
        ],
    )
    @pytest.mark.parametrize(
        "y_distribution",
        [
            FloatDistribution(-1.0, 1.0),
            FloatDistribution(1e-7, 1.0, log=True),
            FloatDistribution(-10, 10, step=0.5),
            IntDistribution(3, 10),
            IntDistribution(1, 100, log=True),
            IntDistribution(3, 9, step=2),
        ],
    )
    def test_sample_relative_numerical(
        self,
        sampler: Callable[[], BaseSampler],
        x_distribution: BaseDistribution,
        y_distribution: BaseDistribution,
    ) -> None:
        """Relative samples of two numerical parameters are in range and of native type."""
        search_space: dict[str, BaseDistribution] = {"x": x_distribution, "y": y_distribution}
        study = optuna.study.create_study(sampler=sampler())

        # Record one finished trial before calling ``sample_relative`` directly.
        first_trial = study.ask(search_space)
        study.tell(first_trial, sum(first_trial.params.values()))

        def draw() -> list[int | float]:
            new_trial = _create_new_trial(study)
            sampled = study.sampler.sample_relative(study, new_trial, search_space)
            return [sampled[key] for key in search_space]

        samples = np.array([draw() for _ in range(10)])
        for column_index, dist in enumerate(search_space.values()):
            assert isinstance(dist, (FloatDistribution, IntDistribution))
            column = samples[:, column_index]
            assert np.all(column >= dist.low)
            assert np.all(column <= dist.high)

        # One further draw is inspected for the Python type of each value.
        for sampled_value, dist in zip(draw(), search_space.values()):
            assert not isinstance(sampled_value, np.floating)
            assert not isinstance(sampled_value, np.integer)
            expected_type = int if isinstance(dist, IntDistribution) else float
            assert isinstance(sampled_value, expected_type)

    def test_sample_relative_categorical(self, sampler: Callable[[], BaseSampler]) -> None:
        """Relative samples of two categorical parameters are valid choices of type ``int``."""
        search_space: dict[str, BaseDistribution] = {
            "x": CategoricalDistribution([1, 10, 100]),
            "y": CategoricalDistribution([-1, -10, -100]),
        }
        study = optuna.study.create_study(sampler=sampler())

        # Record one finished trial before calling ``sample_relative`` directly.
        first_trial = study.ask(search_space)
        study.tell(first_trial, sum(first_trial.params.values()))

        def draw() -> list[float]:
            new_trial = _create_new_trial(study)
            sampled = study.sampler.sample_relative(study, new_trial, search_space)
            return [sampled[key] for key in search_space]

        samples = np.array([draw() for _ in range(10)])
        for column_index, dist in enumerate(search_space.values()):
            assert isinstance(dist, CategoricalDistribution)
            assert np.all([entry in dist.choices for entry in samples[:, column_index]])

        # One further draw is inspected for the Python type of each value.
        for sampled_value in draw():
            assert not isinstance(sampled_value, np.floating)
            assert not isinstance(sampled_value, np.integer)
            assert isinstance(sampled_value, int)

    @pytest.mark.parametrize(
        "x_distribution",
        [
            FloatDistribution(-1.0, 1.0),
            FloatDistribution(1e-7, 1.0, log=True),
            FloatDistribution(-10, 10, step=0.5),
            IntDistribution(1, 10),
            IntDistribution(1, 100, log=True),
        ],
    )
    def test_sample_relative_mixed(
        self, sampler: Callable[[], BaseSampler], x_distribution: BaseDistribution
    ) -> None:
        """Relative samples of one numerical and one categorical parameter are valid."""
        search_space: dict[str, BaseDistribution] = {
            "x": x_distribution,
            "y": CategoricalDistribution([-1, -10, -100]),
        }
        study = optuna.study.create_study(sampler=sampler())

        # Record one finished trial before calling ``sample_relative`` directly.
        first_trial = study.ask(search_space)
        study.tell(first_trial, sum(first_trial.params.values()))

        def draw() -> list[float]:
            new_trial = _create_new_trial(study)
            sampled = study.sampler.sample_relative(study, new_trial, search_space)
            return [sampled[key] for key in search_space]

        samples = np.array([draw() for _ in range(10)])

        # Column 0 holds "x" (numerical) and column 1 holds "y" (categorical).
        assert isinstance(search_space["x"], (FloatDistribution, IntDistribution))
        assert np.all(samples[:, 0] >= search_space["x"].low)
        assert np.all(samples[:, 0] <= search_space["x"].high)
        assert isinstance(search_space["y"], CategoricalDistribution)
        assert np.all([entry in search_space["y"].choices for entry in samples[:, 1]])

        # One further draw is inspected for the Python type of each value.
        integer_valued = (IntDistribution, CategoricalDistribution)
        for sampled_value, dist in zip(draw(), search_space.values()):
            assert not isinstance(sampled_value, np.floating)
            assert not isinstance(sampled_value, np.integer)
            expected_type = int if isinstance(dist, integer_valued) else float
            assert isinstance(sampled_value, expected_type)

    @pytest.mark.parametrize("n_jobs", [1, 2])
    def test_trial_relative_params(self, n_jobs: int, sampler: Callable[[], BaseSampler]) -> None:
        """``trial._relative_params`` is ``None`` before the first suggest call and set after."""
        # TODO(nabenabe): Consider moving this test to study.
        study = optuna.study.create_study(sampler=sampler())

        def objective(trial: Trial) -> float:
            assert trial._relative_params is None

            for param_name in ("x", "y"):
                trial.suggest_float(param_name, -10, 10)
            assert trial._relative_params is not None
            return -1

        study.optimize(objective, n_trials=10, n_jobs=n_jobs)


class MultiObjectiveSamplerTestCase(_BaseSamplerTestCase):
    """Checks of ``sample_independent`` on a study with two objectives."""

    @pytest.mark.parametrize(
        "distribution",
        [
            FloatDistribution(-1.0, 1.0),
            FloatDistribution(0.0, 1.0),
            FloatDistribution(-1.0, 0.0),
            FloatDistribution(1e-7, 1.0, log=True),
            FloatDistribution(-10, 10, step=0.1),
            FloatDistribution(-10.2, 10.2, step=0.1),
            IntDistribution(-10, 10),
            IntDistribution(0, 10),
            IntDistribution(-10, 0),
            IntDistribution(-10, 10, step=2),
            IntDistribution(0, 10, step=2),
            IntDistribution(-10, 0, step=2),
            IntDistribution(1, 100, log=True),
            CategoricalDistribution((1, 2, 3)),
            CategoricalDistribution(("a", "b", "c")),
            CategoricalDistribution((1, "a")),
        ],
    )
    def test_multi_objective_sample_independent(
        self,
        sampler: Callable[[], BaseSampler],
        distribution: BaseDistribution,
    ) -> None:
        """Each of 100 independent samples is contained in the distribution.

        Non-categorical values must additionally not be ``np.floating``, and
        values from a stepped float distribution must lie on the step grid.
        """
        study = optuna.study.create_study(directions=["minimize", "maximize"], sampler=sampler())
        is_categorical = isinstance(distribution, CategoricalDistribution)

        for _ in range(100):
            sampled = study.sampler.sample_independent(
                study, _create_new_trial(study), "x", distribution
            )
            assert distribution._contains(distribution.to_internal_repr(sampled))

            if not is_categorical:
                # Please see https://github.com/optuna/optuna/pull/393 why this assertion
                # is needed.
                assert not isinstance(sampled, np.floating)

            if isinstance(distribution, FloatDistribution) and distribution.step is not None:
                # The offset from ``low``, measured in units of ``step`` (the quantization
                # interval of the distribution), must be a whole number.
                n_steps = (sampled - distribution.low) / distribution.step
                np.testing.assert_almost_equal(np.round(n_steps), n_steps)


class SingleOnlySamplerTestCase(_BaseSamplerTestCase):
    """Checks that the sampler under test raises on a study with two objectives."""

    def test_raise_error_for_samplers_during_multi_objectives(
        self,
        sampler: Callable[[], BaseSampler],
    ) -> None:
        """Independent and relative sampling must each raise ``ValueError``."""
        study = optuna.study.create_study(directions=["maximize", "maximize"], sampler=sampler())

        distribution = FloatDistribution(0.0, 1.0)
        # Create trials outside ``pytest.raises`` so that a ``ValueError`` raised while
        # creating a trial cannot be mistaken for the sampler's error.
        independent_trial = _create_new_trial(study)
        with pytest.raises(ValueError):
            study.sampler.sample_independent(study, independent_trial, "x", distribution)

        relative_trial = _create_new_trial(study)
        with pytest.raises(ValueError):
            # The search-space inference stays inside the block: the error may come
            # from it or from ``sample_relative``.
            study.sampler.sample_relative(
                study,
                relative_trial,
                study.sampler.infer_relative_search_space(study, relative_trial),
            )