Added timing and caching of subsimplex computation results

7 years ago · 3bd910f42b
5 changed files with 117 additions and 41 deletions
--- a/src/storm-pomdp-cli/settings/modules/POMDPSettings.cpp
+++ b/src/storm-pomdp-cli/settings/modules/POMDPSettings.cpp
@ -14,6 +14,7 @@ namespace storm {
            
            const std::string POMDPSettings::moduleName = "pomdp";
            const std::string exportAsParametricModelOption = "parametric-drn";
+            const std::string gridApproximationOption = "gridapproximation";
            const std::string qualitativeReductionOption = "qualitativereduction";
            const std::string analyzeUniqueObservationsOption = "uniqueobservations";
            const std::string mecReductionOption = "mecreduction";
@ -37,6 +38,13 @@ namespace storm {
                this->addOption(storm::settings::OptionBuilder(moduleName, fscmode, false, "Sets the way the pMC is obtained").addArgument(storm::settings::ArgumentBuilder::createStringArgument("type", "type name").addValidatorString(ArgumentValidatorFactory::createMultipleChoiceValidator(fscModes)).setDefaultValueString("standard").build()).build());
                this->addOption(storm::settings::OptionBuilder(moduleName, transformBinaryOption, false, "Transforms the pomdp to a binary pomdp.").build());
                this->addOption(storm::settings::OptionBuilder(moduleName, transformSimpleOption, false, "Transforms the pomdp to a binary and simple pomdp.").build());
+                this->addOption(storm::settings::OptionBuilder(moduleName, gridApproximationOption, false,
+                                                               "Analyze the POMDP using grid approximation.").addArgument(
+                        storm::settings::ArgumentBuilder::createUnsignedIntegerArgument("resolution",
+                                                                                        "the resolution of the grid").setDefaultValueUnsignedInteger(
+                                10).addValidatorUnsignedInteger(
+                                storm::settings::ArgumentValidatorFactory::createUnsignedGreaterValidator(
+                                        0)).build()).build());
            }

            bool POMDPSettings::isExportToParametricSet() const {
@ -62,6 +70,15 @@ namespace storm {
            bool POMDPSettings::isSelfloopReductionSet() const {
                return this->getOption(selfloopReductionOption).getHasOptionBeenSet();
            }
+
+            bool POMDPSettings::isGridApproximationSet() const {
+                return this->getOption(gridApproximationOption).getHasOptionBeenSet();
+            }
+
+            uint64_t POMDPSettings::getGridResolution() const {
+                return this->getOption(gridApproximationOption).getArgumentByName(
+                        "resolution").getValueAsUnsignedInteger();
+            }
            
            uint64_t POMDPSettings::getMemoryBound() const {
                return this->getOption(memoryBoundOption).getArgumentByName("bound").getValueAsUnsignedInteger();
--- a/src/storm-pomdp-cli/settings/modules/POMDPSettings.h
+++ b/src/storm-pomdp-cli/settings/modules/POMDPSettings.h
@ -25,6 +25,8 @@ namespace storm {
                std::string getExportToParametricFilename() const;
                
                bool isQualitativeReductionSet() const;
+
+                bool isGridApproximationSet() const;
                bool isAnalyzeUniqueObservationsSet() const;
                bool isMecReductionSet() const;
                bool isSelfloopReductionSet() const;
@ -32,6 +34,8 @@ namespace storm {
                bool isTransformBinarySet() const;
                std::string getFscApplicationTypeString() const;
                uint64_t getMemoryBound() const;
+
+                uint64_t getGridResolution() const;
                storm::storage::PomdpMemoryPattern getMemoryPattern() const;
                
                bool check() const override;
--- a/src/storm-pomdp-cli/storm-pomdp.cpp
+++ b/src/storm-pomdp-cli/storm-pomdp.cpp
@ -42,6 +42,8 @@
 #include "storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.h"
 #include "storm/api/storm.h"

+#include <typeinfo>
+
 /*!
 * Initialize the settings manager.
 */
@ -113,10 +115,6 @@ int main(const int argc, const char** argv) {
        STORM_LOG_THROW(model && model->getType() == storm::models::ModelType::Pomdp, storm::exceptions::WrongFormatException, "Expected a POMDP.");
        std::shared_ptr<storm::models::sparse::Pomdp<storm::RationalNumber>> pomdp = model->template as<storm::models::sparse::Pomdp<storm::RationalNumber>>();

-        // For ease of testing
-        storm::pomdp::modelchecker::ApproximatePOMDPModelchecker<storm::RationalNumber> checker = storm::pomdp::modelchecker::ApproximatePOMDPModelchecker<storm::RationalNumber>();
-        checker.computeReachabilityProbability(*pomdp, std::set<uint32_t>({7}), false, 10);
-
        std::shared_ptr<storm::logic::Formula const> formula;
        if (!symbolicInput.properties.empty()) {
            formula = symbolicInput.properties.front().getRawFormula();
@ -149,6 +147,42 @@ int main(const int argc, const char** argv) {
                    STORM_PRINT_AND_LOG(" done." << std::endl);
                    std::cout << "actual reduction not yet implemented..." << std::endl;
                }
+                if (pomdpSettings.isGridApproximationSet()) {
+                    storm::logic::ProbabilityOperatorFormula const &probFormula = formula->asProbabilityOperatorFormula();
+                    storm::logic::Formula const &subformula1 = probFormula.getSubformula();
+
+                    std::set<uint32_t> targetObservationSet;
+                    //TODO refactor
+                    bool validFormula = false;
+                    if (subformula1.isEventuallyFormula()) {
+                        storm::logic::EventuallyFormula const &eventuallyFormula = subformula1.asEventuallyFormula();
+                        storm::logic::Formula const &subformula2 = eventuallyFormula.getSubformula();
+                        if (subformula2.isAtomicLabelFormula()) {
+                            storm::logic::AtomicLabelFormula const &alFormula = subformula2.asAtomicLabelFormula();
+                            validFormula = true;
+                            std::string targetLabel = alFormula.getLabel();
+                            auto labeling = pomdp->getStateLabeling();
+                            for (size_t state = 0; state < pomdp->getNumberOfStates(); ++state) {
+                                if (labeling.getStateHasLabel(targetLabel, state)) {
+                                    targetObservationSet.insert(pomdp->getObservation(state));
+                                }
+                            }
+                        }
+                    }
+                    STORM_LOG_THROW(validFormula, storm::exceptions::InvalidPropertyException,
+                                    "The formula is not supported by the grid approximation");
+
+                    storm::pomdp::modelchecker::ApproximatePOMDPModelchecker<storm::RationalNumber> checker = storm::pomdp::modelchecker::ApproximatePOMDPModelchecker<storm::RationalNumber>();
+                    storm::RationalNumber overRes = storm::utility::one<storm::RationalNumber>();
+                    storm::RationalNumber underRes = storm::utility::zero<storm::RationalNumber>();
+                    std::unique_ptr<storm::pomdp::modelchecker::POMDPCheckResult<storm::RationalNumber>> result;
+                    result = checker.computeReachabilityProbability(*pomdp, targetObservationSet,
+                                                                    probFormula.getOptimalityType() ==
+                                                                    storm::OptimizationDirection::Minimize,
+                                                                    pomdpSettings.getGridResolution() + gridIncrease);
+                    overRes = result->OverapproximationValue;
+                    underRes = result->UnderapproximationValue;
+                }
            } else if (formula->isRewardOperatorFormula()) {
                if (pomdpSettings.isSelfloopReductionSet() && storm::solver::minimize(formula->asRewardOperatorFormula().getOptimalityType())) {
                    STORM_PRINT_AND_LOG("Eliminating self-loop choices ...");
--- a/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp
+++ b/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.cpp
@ -22,11 +22,11 @@ namespace storm {
            }

            template<typename ValueType, typename RewardModelType>
-            /*std::unique_ptr<POMDPCheckResult>*/ void
+            std::unique_ptr<POMDPCheckResult<ValueType>>
            ApproximatePOMDPModelchecker<ValueType, RewardModelType>::computeReachabilityProbability(
                    storm::models::sparse::Pomdp<ValueType, RewardModelType> const &pomdp,
                    std::set<uint32_t> targetObservations, bool min, uint64_t gridResolution) {
-                //TODO add timing
+                storm::utility::Stopwatch beliefGridTimer(true);
                uint64_t maxIterations = 100;
                bool finished = false;
                uint64_t iteration = 0;
@ -46,7 +46,9 @@ namespace storm {
                constructBeliefGrid(pomdp, targetObservations, gridResolution, beliefList, beliefGrid, beliefIsTarget,
                                    nextId);
                nextId = beliefList.size();
+                beliefGridTimer.stop();

+                storm::utility::Stopwatch overApproxTimer(true);
                // ID -> Value
                std::map<uint64_t, ValueType> result;
                std::map<uint64_t, ValueType> result_backup;
@ -58,6 +60,7 @@ namespace storm {
                // current ID -> action -> next ID
                std::map<uint64_t, std::vector<std::map<uint32_t, uint64_t>>> nextBelieves;

+                storm::utility::Stopwatch nextBeliefGeneration(true);
                for (size_t i = 0; i < beliefGrid.size(); ++i) {
                    auto currentBelief = beliefGrid[i];
                    bool isTarget = beliefIsTarget[currentBelief.id];
@ -68,6 +71,7 @@ namespace storm {
                        result.emplace(std::make_pair(currentBelief.id, storm::utility::zero<ValueType>()));
                        result_backup.emplace(std::make_pair(currentBelief.id, storm::utility::zero<ValueType>()));

+                        //TODO put this in extra function
                        std::vector<std::map<uint32_t, ValueType>> observationProbabilitiesInAction;
                        std::vector<std::map<uint32_t, uint64_t>> nextBelievesInAction;

@ -98,9 +102,17 @@ namespace storm {
                        nextBelieves.emplace(std::make_pair(currentBelief.id, nextBelievesInAction));
                    }
                }
+                nextBeliefGeneration.stop();
+
+                //Use chaching to avoid multiple computation of the subsimplices and lambdas
+                std::map<uint64_t, std::vector<std::vector<ValueType>>> subSimplexCache;
+                std::map<uint64_t, std::vector<ValueType>> lambdaCache;
+
+                STORM_PRINT("Time generation of next believes: " << nextBeliefGeneration << std::endl)
                // Value Iteration
                auto cc = storm::utility::ConstantsComparator<ValueType>();
                while (!finished && iteration < maxIterations) {
+                    storm::utility::Stopwatch iterationTimer(true);
                    STORM_LOG_DEBUG("Iteration " << iteration + 1);
                    bool improvement = false;
                    for (size_t i = 0; i < beliefGrid.size(); ++i) {
@ -123,10 +135,20 @@ namespace storm {
                                    uint32_t observation = iter->first;
                                    storm::pomdp::Belief<ValueType> nextBelief = beliefList[nextBelieves[currentBelief.id][action][observation]];
                                    // compute subsimplex and lambdas according to the Lovejoy paper to approximate the next belief
-                                    std::pair<std::vector<std::vector<ValueType>>, std::vector<ValueType>> temp = computeSubSimplexAndLambdas(
-                                            nextBelief.probabilities, gridResolution);
-                                    std::vector<std::vector<ValueType>> subSimplex = temp.first;
-                                    std::vector<ValueType> lambdas = temp.second;
+                                    // cache the values  to not always re-calculate
+                                    std::vector<std::vector<ValueType>> subSimplex;
+                                    std::vector<ValueType> lambdas;
+                                    if (subSimplexCache.count(nextBelief.id) > 0) {
+                                        subSimplex = subSimplexCache[nextBelief.id];
+                                        lambdas = lambdaCache[nextBelief.id];
+                                    } else {
+                                        std::pair<std::vector<std::vector<ValueType>>, std::vector<ValueType>> temp = computeSubSimplexAndLambdas(
+                                                nextBelief.probabilities, gridResolution);
+                                        subSimplex = temp.first;
+                                        lambdas = temp.second;
+                                        subSimplexCache[nextBelief.id] = subSimplex;
+                                        lambdaCache[nextBelief.id] = lambdas;
+                                    }

                                    auto sum = storm::utility::zero<ValueType>();
                                    for (size_t j = 0; j < lambdas.size(); ++j) {
@ -138,17 +160,11 @@ namespace storm {
                                    currentValue += iter->second * sum;
                                }

-                                // Update the selected actions TODO make this nicer
+                                // Update the selected actions
                                if ((min && cc.isLess(storm::utility::zero<ValueType>(), chosenValue - currentValue)) ||
                                    (!min &&
-                                     cc.isLess(storm::utility::zero<ValueType>(), currentValue - chosenValue))) {
-                                    chosenValue = currentValue;
-                                    chosenActionIndex = action;
-                                } else if ((min && cc.isEqual(storm::utility::zero<ValueType>(),
-                                                              chosenValue - currentValue)) ||
-                                           (!min &&
-                                            cc.isEqual(storm::utility::zero<ValueType>(),
-                                                       currentValue - chosenValue))) {
+                                     cc.isLess(storm::utility::zero<ValueType>(), currentValue - chosenValue)) ||
+                                    cc.isEqual(storm::utility::zero<ValueType>(), chosenValue - currentValue)) {
                                    chosenValue = currentValue;
                                    chosenActionIndex = action;
                                }
@ -171,9 +187,11 @@ namespace storm {
                        result_backup[iter->first] = result[iter->first];
                    }
                    ++iteration;
+                    iterationTimer.stop();
+                    STORM_PRINT("Iteration " << iteration << ": " << iterationTimer << std::endl);
                }

-                STORM_PRINT("Grid approximation took " << iteration << " iterations" << std::endl);
+                STORM_PRINT("Overapproximation took " << iteration << " iterations" << std::endl);

                beliefGrid.push_back(initialBelief);
                beliefIsTarget.push_back(
@ -192,9 +210,10 @@ namespace storm {
                                                                        initSubSimplex[j])];
                    }
                }
+                overApproxTimer.stop();

                // Now onto the under-approximation
-
+                storm::utility::Stopwatch underApproxTimer(true);
                std::set<uint64_t> visitedBelieves;
                std::deque<uint64_t> believesToBeExpanded;
                std::map<uint64_t, uint64_t> beliefStateMap;
@ -243,12 +262,6 @@ namespace storm {
                    believesToBeExpanded.pop_front();
                }

-                for (size_t i = 0; i < transitions.size(); ++i) {
-                    for (auto const &transition : transitions[i]) {
-                        STORM_LOG_DEBUG(
-                                "Transition: " << i << " -- " << transition.second << "--> " << transition.first);
-                    }
-                }
                storm::models::sparse::StateLabeling labeling(transitions.size());
                labeling.addLabel("init");
                labeling.addLabel("target");
@ -276,8 +289,17 @@ namespace storm {
                ValueType resultValue = res->asExplicitQuantitativeCheckResult<ValueType>().getValueMap().begin()->second;


+                STORM_PRINT("Time Belief Grid Generation: " << beliefGridTimer << std::endl
+                                                            << "Time Overapproximation: " << overApproxTimer
+                                                            << std::endl
+                                                            << "Time Underapproximation: " << underApproxTimer
+                                                            << std::endl);
+
                STORM_PRINT("Over-Approximation Result: " << overApprox << std::endl);
                STORM_PRINT("Under-Approximation Result: " << resultValue << std::endl);
+
+                return std::make_unique<POMDPCheckResult<ValueType>>(
+                        POMDPCheckResult<ValueType>{overApprox, resultValue});
            }

            template<typename ValueType, typename RewardModelType>
@ -311,9 +333,10 @@ namespace storm {
                    uint64_t gridResolution, uint64_t currentBeliefId, uint64_t nextId, bool min) {
                auto cc = storm::utility::ConstantsComparator<ValueType>();
                storm::pomdp::Belief<ValueType> currentBelief = beliefList[currentBeliefId];
+
+                //TODO put this in extra function
                std::vector<std::map<uint32_t, ValueType>> observationProbabilitiesInAction;
                std::vector<std::map<uint32_t, uint64_t>> nextBelievesInAction;
-
                uint64_t numChoices = pomdp.getNumberOfChoices(
                        pomdp.getStatesWithObservation(currentBelief.observation).front());
                for (uint64_t action = 0; action < numChoices; ++action) {
@ -354,8 +377,7 @@ namespace storm {
                        storm::pomdp::Belief<ValueType> nextBelief = beliefList[nextBelieves[currentBelief.id][action][observation]];

                        // compute subsimplex and lambdas according to the Lovejoy paper to approximate the next belief
-                        auto temp = computeSubSimplexAndLambdas(
-                                nextBelief.probabilities, gridResolution);
+                        auto temp = computeSubSimplexAndLambdas(nextBelief.probabilities, gridResolution);
                        std::vector<std::vector<ValueType>> subSimplex = temp.first;
                        std::vector<ValueType> lambdas = temp.second;

@ -369,15 +391,11 @@ namespace storm {
                        currentValue += iter->second * sum;
                    }

-                    // Update the selected actions TODO make this nicer
+                    // Update the selected actions
                    if ((min && cc.isLess(storm::utility::zero<ValueType>(), chosenValue - currentValue)) ||
                        (!min &&
-                         cc.isLess(storm::utility::zero<ValueType>(), currentValue - chosenValue))) {
-                        chosenValue = currentValue;
-                        chosenActionIndex = action;
-                    } else if ((min && cc.isEqual(storm::utility::zero<ValueType>(), chosenValue - currentValue)) ||
-                               (!min &&
-                                cc.isEqual(storm::utility::zero<ValueType>(), currentValue - chosenValue))) {
+                         cc.isLess(storm::utility::zero<ValueType>(), currentValue - chosenValue)) ||
+                        cc.isEqual(storm::utility::zero<ValueType>(), chosenValue - currentValue)) {
                        chosenValue = currentValue;
                        chosenActionIndex = action;
                    }
@ -561,7 +579,6 @@ namespace storm {
                }
                lambdas[0] = storm::utility::one<ValueType>() - sum;

-                //TODO add assertion that we are close enough
                return std::make_pair(subSimplex, lambdas);
            }

--- a/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.h
+++ b/src/storm-pomdp/modelchecker/ApproximatePOMDPModelchecker.h
@ -9,19 +9,23 @@
 namespace storm {
    namespace pomdp {
        namespace modelchecker {
-            class POMDPCheckResult;
+            template<class ValueType>
+            struct POMDPCheckResult {
+                ValueType OverapproximationValue;
+                ValueType UnderapproximationValue;
+            };

            template<class ValueType, typename RewardModelType = models::sparse::StandardRewardModel<ValueType>>
            class ApproximatePOMDPModelchecker {
            public:
                explicit ApproximatePOMDPModelchecker();

-                /*std::unique_ptr<POMDPCheckResult>*/ void
+                std::unique_ptr<POMDPCheckResult<ValueType>>
                computeReachabilityProbability(storm::models::sparse::Pomdp<ValueType, RewardModelType> const &pomdp,
                                               std::set<uint32_t> targetObservations, bool min,
                                               uint64_t gridResolution);

-                std::unique_ptr<POMDPCheckResult>
+                std::unique_ptr<POMDPCheckResult<ValueType>>
                computeReachabilityReward(storm::models::sparse::Pomdp<ValueType, RewardModelType> const &pomdp,
                                          std::set<uint32_t> target_observations, uint64_t gridResolution);