@@ -9,6 +9,8 @@
# include "storm/modelchecker/propositional/SparsePropositionalModelChecker.h"
# include "storm/modelchecker/propositional/SparsePropositionalModelChecker.h"
# include "storm/modelchecker/results/ExplicitQualitativeCheckResult.h"
# include "storm/modelchecker/results/ExplicitQualitativeCheckResult.h"
# include "storm/modelchecker/prctl/helper/BaierUpperRewardBoundsComputer.h"
# include "storm/transformer/EndComponentEliminator.h"
# include "storm/transformer/EndComponentEliminator.h"
# include "storm/exceptions/UnexpectedException.h"
# include "storm/exceptions/UnexpectedException.h"
@@ -548,6 +550,103 @@ namespace storm {
    return precision / storm::utility::convertNumber<ValueType>(sumOfDimensions);
}

template<typename ValueType, bool SingleObjectiveMode>
boost::optional<ValueType> MultiDimensionalRewardUnfolding<ValueType, SingleObjectiveMode>::getUpperObjectiveBound(uint64_t objectiveIndex) {
    auto& objective = this->objectives[objectiveIndex];
    if (!objective.upperResultBound) {
        if (objective.formula->isProbabilityOperatorFormula()) {
            objective.upperResultBound = storm::utility::one<ValueType>();
        } else if (objective.formula->isRewardOperatorFormula()) {
            auto const& rewModel = this->model.getRewardModel(objective.formula->asRewardOperatorFormula().getRewardModelName());
            auto actionRewards = rewModel.getTotalRewardVector(this->model.getTransitionMatrix());
            if (objective.formula->getSubformula().isCumulativeRewardFormula()) {
                // Try to get an upper bound by computing the maximal reward achievable within one epoch step
                auto const& cumulativeRewardFormula = objective.formula->getSubformula().asCumulativeRewardFormula();
                ValueType rewardBound = cumulativeRewardFormula.template getBound<ValueType>();
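                // If the epoch bound refers to another reward ('cost') model, bound the objective by the
                // largest reward collected per unit of cost, multiplied with the cost bound.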
                if (cumulativeRewardFormula.getTimeBoundReference().isRewardBound()) {
                    auto const& costModel = this->model.getRewardModel(cumulativeRewardFormula.getTimeBoundReference().getRewardName());
                    if (!costModel.hasTransitionRewards()) {
                        auto actionCosts = costModel.getTotalRewardVector(this->model.getTransitionMatrix());
                        ValueType largestRewardPerCost = storm::utility::zero<ValueType>();
                        bool isFinite = true;
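                        // A choice with positive reward but zero cost makes the reward-per-cost ratio (and thus the bound) infinite.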
                        for (auto rewIt = actionRewards.begin(), costIt = actionCosts.begin(); rewIt != actionRewards.end(); ++rewIt, ++costIt) {
                            if (!storm::utility::isZero(*rewIt)) {
                                if (storm::utility::isZero(*costIt)) {
                                    isFinite = false;
                                    break;
                                }
                                ValueType rewardPerCost = *rewIt / *costIt;
                                largestRewardPerCost = std::max(largestRewardPerCost, rewardPerCost);
                            }
                        }
                        if (isFinite) {
                            objective.upperResultBound = largestRewardPerCost * rewardBound;
                        }
                    }
                } else {
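                    // The epoch bound is a step (or time) bound: at most the largest action reward is collected per step.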
                    objective.upperResultBound = (*std::max_element(actionRewards.begin(), actionRewards.end())) * rewardBound;
                }
                // If we could not find an upper bound, try to get an upper bound for the unbounded case
                if (!objective.upperResultBound) {
                    storm::storage::BitVector allStates(model.getNumberOfStates(), true);
                    // Get the set of states from which reward is reachable
                    auto nonZeroRewardStates = rewModel.getStatesWithZeroReward(model.getTransitionMatrix());
                    nonZeroRewardStates.complement();
                    auto expRewGreater0EStates = storm::utility::graph::performProbGreater0E(model.getBackwardTransitions(), allStates, nonZeroRewardStates);
                    // Eliminate zero-reward ECs
                    auto zeroRewardChoices = rewModel.getChoicesWithZeroReward(model.getTransitionMatrix());
                    auto ecElimRes = storm::transformer::EndComponentEliminator<ValueType>::transform(model.getTransitionMatrix(), expRewGreater0EStates, zeroRewardChoices, ~allStates);
                    allStates.resize(ecElimRes.matrix.getRowGroupCount());
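                    // For each choice of the reduced model, track whether it can leave the considered states
                    // and the probability of moving to a state with expected reward zero.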
                    storm::storage::BitVector outStates(allStates.size(), false);
                    std::vector<ValueType> rew0StateProbs;
                    rew0StateProbs.reserve(ecElimRes.matrix.getRowCount());
                    for (uint64_t state = 0; state < allStates.size(); ++state) {
                        for (uint64_t choice = ecElimRes.matrix.getRowGroupIndices()[state]; choice < ecElimRes.matrix.getRowGroupIndices()[state + 1]; ++choice) {
                            // Check whether the choice leads to a state with expRew 0 in the original model
                            bool isOutChoice = false;
                            uint64_t originalModelChoice = ecElimRes.newToOldRowMapping[choice];
                            for (auto const& entry : model.getTransitionMatrix().getRow(originalModelChoice)) {
                                if (!expRewGreater0EStates.get(entry.getColumn())) {
                                    isOutChoice = true;
                                    outStates.set(state, true);
                                    rew0StateProbs.push_back(storm::utility::one<ValueType>() - ecElimRes.matrix.getRowSum(choice));
                                    assert(!storm::utility::isZero(rew0StateProbs.back()));
                                    break;
                                }
                            }
                            if (!isOutChoice) {
                                rew0StateProbs.push_back(storm::utility::zero<ValueType>());
                            }
                        }
                    }
                    // An upper reward bound can only be computed if it is below infinity
                    if (storm::utility::graph::performProb1A(ecElimRes.matrix, ecElimRes.matrix.getRowGroupIndices(), ecElimRes.matrix.transpose(true), allStates, outStates).full()) {
                        std::vector<ValueType> rewards;
                        rewards.reserve(ecElimRes.matrix.getRowCount());
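                        // Map each row of the reduced model back to its original action reward.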
                        for (auto row : ecElimRes.newToOldRowMapping) {
                            rewards.push_back(actionRewards[row]);
                        }
                        storm::modelchecker::helper::BaierUpperRewardBoundsComputer<ValueType> baier(ecElimRes.matrix, rewards, rew0StateProbs);
                        objective.upperResultBound = baier.computeUpperBound();
                    }
                }
            }
        }
    }
    return objective.upperResultBound;
}

template<typename ValueType, bool SingleObjectiveMode>
boost::optional<ValueType> MultiDimensionalRewardUnfolding<ValueType, SingleObjectiveMode>::getLowerObjectiveBound(uint64_t objectiveIndex) {
    auto& objective = this->objectives[objectiveIndex];
    if (!objective.lowerResultBound) {
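        // Fall back to zero as a trivial lower bound.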
        objective.lowerResultBound = storm::utility::zero<ValueType>();
    }
    return objective.lowerResultBound;
}

template<typename ValueType, bool SingleObjectiveMode>
void MultiDimensionalRewardUnfolding<ValueType, SingleObjectiveMode>::setSolutionForCurrentEpoch(std::vector<SolutionType>&& inStateSolutions) {
    STORM_LOG_ASSERT(currentEpoch, "Tried to set a solution for the current epoch, but no epoch was specified before.");