#pragma once

#include "storm/solver/AbstractEquationSolver.h"
#include "storm/storage/BitVector.h"
#include "storm/storage/SparseMatrix.h"
#include "storm/storage/Scheduler.h"
#include "storm/storage/MaximalEndComponentDecomposition.h"
#include "storm/transformer/EndComponentEliminator.h"
#include "storm/modelchecker/helper/infinitehorizon/SparseNondeterministicInfiniteHorizonHelper.h"
#include "storm/modelchecker/helper/infinitehorizon/SparseDeterministicInfiniteHorizonHelper.h"
#include "storm/modelchecker/multiobjective/Objective.h"
#include "storm/modelchecker/multiobjective/pcaa/PcaaWeightVectorChecker.h"
#include "storm/modelchecker/multiobjective/preprocessing/SparseMultiObjectivePreprocessorResult.h"
#include "storm/utility/vector.h"
#include "storm/storage/BoostTypes.h"

namespace storm {
    namespace modelchecker {
        namespace multiobjective {
            
            /*!
             * Helper Class that takes preprocessed Pcaa data and a weight vector and ...
             * - computes the optimal expected reward w.r.t. the weighted sum of the rewards of the individual objectives
             * - extracts the scheduler that induces this optimum
             * - computes for each objective the value induced by this scheduler
             */
            template <class SparseModelType>
            class StandardPcaaWeightVectorChecker : public PcaaWeightVectorChecker<SparseModelType> {
            public:
                typedef typename SparseModelType::ValueType ValueType;
                using DeterministicInfiniteHorizonHelperType = typename std::conditional<std::is_same<SparseModelType, storm::models::sparse::MarkovAutomaton<ValueType>>::value,
                                                                        storm::modelchecker::helper::SparseNondeterministicInfiniteHorizonHelper<ValueType>,
                                                                        storm::modelchecker::helper::SparseDeterministicInfiniteHorizonHelper<ValueType>>::type;

                /*
                 * Creates a weight vextor checker.
                 *
                 * @param model The (preprocessed) model
                 * @param objectives The (preprocessed) objectives
                 * @param possibleECActions Overapproximation of the actions that are part of an EC
                 * @param possibleBottomStates The states for which it is posible to not collect further reward with prob. 1
                 *
                 */
                StandardPcaaWeightVectorChecker(preprocessing::SparseMultiObjectivePreprocessorResult<SparseModelType> const& preprocessorResult);
                
                /*!
                 * - computes the optimal expected reward w.r.t. the weighted sum of the rewards of the individual objectives
                 * - extracts the scheduler that induces this optimum
                 * - computes for each objective the value induced by this scheduler
                 */
                virtual void check(Environment const& env, std::vector<ValueType> const& weightVector) override;
                
                /*!
                 * Retrieves the results of the individual objectives at the initial state of the given model.
                 * Note that check(..) has to be called before retrieving results. Otherwise, an exception is thrown.
                 * Also note that there is no guarantee that the under/over approximation is in fact correct
                 * as long as the underlying solution methods are unsound (e.g., standard value iteration).
                 */
                virtual std::vector<ValueType> getUnderApproximationOfInitialStateResults() const override;
                virtual std::vector<ValueType> getOverApproximationOfInitialStateResults() const override;
                
                /*!
                 * Retrieves a scheduler that induces the current values
                 * Note that check(..) has to be called before retrieving the scheduler. Otherwise, an exception is thrown.
                 * Also note that (currently) the scheduler only supports unbounded objectives.
                 */
                virtual storm::storage::Scheduler<ValueType> computeScheduler() const override;
                
                
            protected:
                
                void initialize(preprocessing::SparseMultiObjectivePreprocessorResult<SparseModelType> const& preprocessorResult);
                virtual void initializeModelTypeSpecificData(SparseModelType const& model) = 0;
                virtual storm::modelchecker::helper::SparseNondeterministicInfiniteHorizonHelper<ValueType> createNondetInfiniteHorizonHelper(storm::storage::SparseMatrix<ValueType> const& transitions) const = 0;
                virtual DeterministicInfiniteHorizonHelperType createDetInfiniteHorizonHelper(storm::storage::SparseMatrix<ValueType> const& transitions) const = 0;

                void infiniteHorizonWeightedPhase(Environment const& env, std::vector<ValueType> const& weightedActionRewardVector, boost::optional<std::vector<ValueType>> const& weightedStateRewardVector);
                
                /*!
                 * Determines the scheduler that optimizes the weighted reward vector of the unbounded objectives
                 *
                 * @param weightedRewardVector the weighted rewards (only considering the unbounded objectives)
                 */
                void unboundedWeightedPhase(Environment const& env, std::vector<ValueType> const& weightedRewardVector, std::vector<ValueType> const& weightVector);
                
                /*!
                 * Computes the values of the objectives that do not have a stepBound w.r.t. the scheduler computed in the unboundedWeightedPhase
                 *
                 */
                void unboundedIndividualPhase(Environment const& env, std::vector<ValueType> const& weightVector);
                
                /*!
                 * For each time epoch (starting with the maximal stepBound occurring in the objectives), this method
                 * - determines the objectives that are relevant in the current time epoch
                 * - determines the maximizing scheduler for the weighted reward vector of these objectives
                 * - computes the values of these objectives w.r.t. this scheduler
                 *
                 * @param weightVector the weight vector of the current check
                 * @param weightedRewardVector the weighted rewards considering the unbounded objectives. Will be invalidated after calling this.
                 */
                virtual void boundedPhase(Environment const& env, std::vector<ValueType> const& weightVector, std::vector<ValueType>& weightedRewardVector) = 0;
                
                void updateEcQuotient(std::vector<ValueType> const& weightedRewardVector);
                
                
                void setBoundsToSolver(storm::solver::AbstractEquationSolver<ValueType>& solver, bool requiresLower, bool requiresUpper, uint64_t objIndex, storm::storage::SparseMatrix<ValueType> const& transitions, storm::storage::BitVector const& rowsWithSumLessOne, std::vector<ValueType> const& rewards) const;
                void setBoundsToSolver(storm::solver::AbstractEquationSolver<ValueType>& solver, bool requiresLower, bool requiresUpper, std::vector<ValueType> const& weightVector, storm::storage::BitVector const& objectiveFilter, storm::storage::SparseMatrix<ValueType> const& transitions, storm::storage::BitVector const& rowsWithSumLessOne, std::vector<ValueType> const& rewards) const;
                void computeAndSetBoundsToSolver(storm::solver::AbstractEquationSolver<ValueType>& solver, bool requiresLower, bool requiresUpper, storm::storage::SparseMatrix<ValueType> const& transitions, storm::storage::BitVector const& rowsWithSumLessOne, std::vector<ValueType> const& rewards) const;

                /*!
                 * Transforms the results of a min-max-solver that considers a reduced model (without end components) to a result for the original (unreduced) model
                 */
                void transformEcqSolutionToOriginalModel(std::vector<ValueType> const& ecqSolution,
                                                             std::vector<uint_fast64_t> const& ecqOptimalChoices,
                                                             std::map<uint64_t, uint64_t> const& ecqStateToOptimalMecMap,
                                                             std::vector<ValueType>& originalSolution,
                                                             std::vector<uint_fast64_t>& originalOptimalChoices) const;
                
                
                // Data regarding the given model
                // The transition matrix of the considered model
                storm::storage::SparseMatrix<ValueType> transitionMatrix;
                // The initial state of the considered model
                uint64_t initialState;
                // Overapproximation of the set of choices that are part of an end component.
                storm::storage::BitVector ecChoicesHint;
                // The actions that have reward assigned for at least one objective without upper timeBound
                storm::storage::BitVector actionsWithoutRewardInUnboundedPhase;
                // The states for which there is a scheduler yielding reward 0 for each total reward objective
                storm::storage::BitVector totalReward0EStates;
                // stores the state action rewards for each objective.
                std::vector<std::vector<ValueType>> actionRewards;
                // stores the state rewards for each objective.
                // These are only relevant for LRA objectives for MAs (otherwise, they appear within the action rewards). For other objectives/models, the corresponding vector will be empty.
                std::vector<std::vector<ValueType>> stateRewards;
                
                // stores the indices of the objectives for which we need to compute the long run average values
                storm::storage::BitVector lraObjectives;
                // stores the indices of the objectives for which there is no upper time bound
                storm::storage::BitVector objectivesWithNoUpperTimeBound;
                
                // Memory for the solution of the most recent call of check(..)
                // becomes true after the first call of check(..)
                bool checkHasBeenCalled;
                // The result for the weighted reward vector (for all states of the model)
                std::vector<ValueType> weightedResult;
                // The results for the individual objectives (w.r.t. all states of the model)
                std::vector<std::vector<ValueType>> objectiveResults;
                // Stores for each objective the distance between the computed result (w.r.t. the initial state) and an over/under approximation for the actual result.
                // The distances are stored as a (possibly negative) offset that has to be added (+) to to the objectiveResults.
                std::vector<ValueType> offsetsToUnderApproximation;
                std::vector<ValueType> offsetsToOverApproximation;
                // The scheduler choices that optimize the weighted rewards of undounded objectives.
                std::vector<uint64_t> optimalChoices;
                
                struct EcQuotient {
                    storm::storage::SparseMatrix<ValueType> matrix;
                    std::vector<uint_fast64_t> ecqToOriginalChoiceMapping;
                    std::vector<uint_fast64_t> originalToEcqStateMapping;
                    std::vector<storm::storage::FlatSetStateContainer> ecqToOriginalStateMapping;
                    storm::storage::BitVector ecqStayInEcChoices;
                    storm::storage::BitVector origReward0Choices; // includes total and LRA rewards
                    storm::storage::BitVector origTotalReward0Choices; // considers just total rewards
                    storm::storage::BitVector rowsWithSumLessOne;
                    
                    std::vector<ValueType> auxStateValues;
                    std::vector<ValueType> auxChoiceValues;
                };
                boost::optional<EcQuotient> ecQuotient;
                
                struct LraMecDecomposition {
                    storm::storage::MaximalEndComponentDecomposition<ValueType> mecs;
                    std::vector<ValueType> auxMecValues;
                };
                boost::optional<LraMecDecomposition> lraMecDecomposition;
                
            };
            
        }
    }
}